initial stage
This commit is contained in:
parent
541581c8b2
commit
b3a9ad8342
|
@ -0,0 +1,45 @@
|
|||
import os
|
||||
from datetime import timedelta
|
||||
|
||||
import pendulum
|
||||
import requests
|
||||
from airflow.decorators import dag
|
||||
from airflow.decorators import task
|
||||
from airflow.providers.amazon.aws.hooks.s3 import S3Hook
|
||||
from airflow.providers.amazon.aws.transfers.http_to_s3 import HttpToS3Operator
|
||||
|
||||
from common import s3_dowload_unzip_upload
|
||||
|
||||
S3_CONN_ID = os.getenv("S3_CONN_ID", "s3_conn")
|
||||
EXECUTION_TIMEOUT = int(os.getenv("EXECUTION_TIMEOUT", 6))
|
||||
|
||||
default_args = {
|
||||
"execution_timeout": timedelta(hours=EXECUTION_TIMEOUT),
|
||||
"retries": int(os.getenv("DEFAULT_TASK_RETRIES", 1)),
|
||||
"retry_delay": timedelta(seconds=int(os.getenv("DEFAULT_RETRY_DELAY_SECONDS", 60))),
|
||||
}
|
||||
|
||||
|
||||
@dag(
|
||||
start_date=pendulum.datetime(2021, 1, 1, tz="UTC"),
|
||||
schedule=None,
|
||||
catchup=False,
|
||||
default_args=default_args,
|
||||
params={
|
||||
"file": "File to download",
|
||||
"dst_bucket": "bucket that will contain file"
|
||||
},
|
||||
tags=["s3"],
|
||||
)
|
||||
def openaire_to_s3(**context):
|
||||
return HttpToS3Operator(
|
||||
task_id="http_to_s3_task",
|
||||
http_conn_id="openaire_conn",
|
||||
endpoint="/data/graph/" + context["params"]["file"],
|
||||
s3_conn_id=S3_CONN_ID,
|
||||
s3_bucket=context["params"]["dst_bucket"],
|
||||
s3_key="/data/graph/" + context["params"]["file"],
|
||||
replace=True,
|
||||
)
|
||||
|
||||
openaire_to_s3()
|
Loading…
Reference in New Issue