Source code for diff_classifier.aws

"""IO functions for downloading and uploading files from AWS S3 buckets.

The diff_classifier module was built to be used with conjunction with AWS
services. With the exception of Cloudknot parallelization capabilities, most
functions can be used separate from AWS. These functions faciliate interaction
with files stores in S3 buckets. Users must have appropriate credentials to
access desired S3 buckets.

"""
import os
import os.path as op

import boto3


# import diff_classifier.imagej as ij


[docs]def download_s3(remote_fname, local_fname, bucket_name="ccurtis.data"): """Download a file from S3 to local file-system Parameters ---------- remote_fname: string Name of remote file in S3 bucket. local_fname: string Desired name to be stored on local computer. bucket_name: string Bucket name on S3. """ if not os.path.exists(local_fname): sthree = boto3.resource('s3') buckt = sthree.Bucket(bucket_name) buckt.download_file(remote_fname, local_fname)
[docs]def upload_s3(local_fname, remote_fname, bucket_name="ccurtis.data"): """ Upload a file from local file-system to S3. Parameters ---------- local_fname: string Name of local file stored on computer. remote_fname: string Desired name to be stored in S3 bucket. bucket_name: string Bucket name on S3. """ sthree = boto3.resource('s3') buckt = sthree.Bucket(bucket_name) buckt.upload_file(local_fname, remote_fname)
# def partition_and_store(remote_fname, local_dir, bucket_name="ccurtis7.pup"): # """ # Download image from S3, partition, and upload partitions to S3. # Parameters # ---------- # remote_fname: string # Target filename in S3 bucket. # local_dir: string # Local directory to store downloaded file. # bucket_name: string # Bucket name on S3. # Returns # ------- # remote_names: list of strings. # Names of partitioned images in S3. # """ # remote_dir, remote_file = op.split(remote_fname) # download_s3(remote_fname, op.join(local_dir, remote_file)) # names = ij.partition_im(op.join(local_dir, remote_file)) # remote_names = [] # for file in names: # local_file = op.split(file)[1] # upload_s3(op.join(local_dir, local_file), op.join(remote_dir, local_file)) # remote_names.append(op.join(remote_dir, local_file)) # return remote_names