|
| 1 | +# Copyright 2021 Google LLC |
| 2 | +# |
| 3 | +# Licensed under the Apache License, Version 2.0 (the "License"); |
| 4 | +# you may not use this file except in compliance with the License. |
| 5 | +# You may obtain a copy of the License at |
| 6 | +# |
| 7 | +# http://www.apache.org/licenses/LICENSE-2.0 |
| 8 | +# |
| 9 | +# Unless required by applicable law or agreed to in writing, software |
| 10 | +# distributed under the License is distributed on an "AS IS" BASIS, |
| 11 | +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 12 | +# See the License for the specific language governing permissions and |
| 13 | +# limitations under the License. |
| 14 | + |
| 15 | + |
| 16 | +from airflow import DAG |
| 17 | +from airflow.operators import bash |
| 18 | + |
| 19 | +default_args = { |
| 20 | + "owner": "Google", |
| 21 | + "depends_on_past": False, |
| 22 | + "start_date": "2022-06-10", |
| 23 | +} |
| 24 | + |
| 25 | + |
| 26 | +with DAG( |
| 27 | + dag_id="fashion_mnist.fashion_mnist", |
| 28 | + default_args=default_args, |
| 29 | + max_active_runs=1, |
| 30 | + schedule_interval="@weekly", |
| 31 | + catchup=False, |
| 32 | + default_view="graph", |
| 33 | +) as dag: |
| 34 | + |
| 35 | + # Task to copy `fashion-mnist.gz` from FASHION MNIST Database to GCS |
| 36 | + download_zip_files = bash.BashOperator( |
| 37 | + task_id="download_zip_files", |
| 38 | + bash_command="mkdir -p $data_dir/fashion-mnist\ncurl -o $data_dir/fashion-mnist/t10k-images-idx3-ubyte.gz -L $fashion_mnist_test\ncurl -o $data_dir/fashion-mnist/train-images-idx3-ubyte.gz -L $fashion_mnist_train\ncurl -o $data_dir/fashion-mnist/train-labels-idx1-ubyte.gz -L $fashion_mnist_train_labels\ncurl -o $data_dir/fashion-mnist/t10k-labels-idx1-ubyte.gz -L $fashion_mnist_test_labels\n", |
| 39 | + env={ |
| 40 | + "data_dir": "/home/airflow/gcs/data/fashion-mnist", |
| 41 | + "fashion_mnist_test": "http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz", |
| 42 | + "fashion_mnist_train": "http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz", |
| 43 | + "fashion_mnist_train_labels": "http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz", |
| 44 | + "fashion_mnist_test_labels": "http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz", |
| 45 | + }, |
| 46 | + ) |
| 47 | + |
| 48 | + download_zip_files |
0 commit comments