1#!/usr/bin/env python 2# Copyright 2014 The Chromium Authors. All rights reserved. 3# Use of this source code is governed by a BSD-style license that can be 4# found in the LICENSE file. 5 6import argparse 7import logging 8import os 9import subprocess 10import sys 11 12from telemetry.core import util 13from telemetry.internal.util import command_line 14 15sys.path.insert(1, os.path.abspath(os.path.join( 16 util.GetCatapultDir(), 'catapult_base'))) 17from catapult_base import cloud_storage 18 19 20BUCKETS = {bucket: easy_bucket_name for easy_bucket_name, bucket 21 in cloud_storage.BUCKET_ALIASES.iteritems()} 22 23 24def _GetPaths(path): 25 root, ext = os.path.splitext(path) 26 if ext == '.sha1': 27 file_path = root 28 hash_path = path 29 else: 30 file_path = path 31 hash_path = path + '.sha1' 32 return file_path, hash_path 33 34 35def _FindFilesInCloudStorage(files): 36 """Returns a dict of all files and which buckets they're in.""" 37 # Preprocessing: get the contents of all buckets. 38 bucket_contents = {} 39 for bucket in BUCKETS: 40 try: 41 bucket_contents[bucket] = cloud_storage.List(bucket) 42 except (cloud_storage.PermissionError, cloud_storage.CredentialsError): 43 pass 44 45 # Check if each file is in the bucket contents. 46 file_buckets = {} 47 for path in files: 48 file_path, hash_path = _GetPaths(path) 49 50 if file_path in file_buckets: 51 # Ignore duplicates, if both data and sha1 file were in the file list. 52 continue 53 if not os.path.exists(hash_path): 54 # Probably got some non-Cloud Storage files in the file list. Ignore. 55 continue 56 57 file_hash = cloud_storage.ReadHash(hash_path) 58 file_buckets[file_path] = [] 59 for bucket in BUCKETS: 60 if bucket in bucket_contents and file_hash in bucket_contents[bucket]: 61 file_buckets[file_path].append(bucket) 62 63 return file_buckets 64 65 66class Ls(command_line.Command): 67 """List which bucket each file is in.""" 68 69 @classmethod 70 def AddCommandLineArgs(cls, parser): 71 parser.add_argument('-r', '--recursive', action='store_true') 72 parser.add_argument('paths', nargs='+') 73 74 @classmethod 75 def ProcessCommandLineArgs(cls, parser, args): 76 for path in args.paths: 77 if not os.path.exists(path): 78 parser.error('Path not found: %s' % path) 79 80 def Run(self, args): 81 def GetFilesInPaths(paths, recursive): 82 """If path is a dir, yields all files in path, otherwise just yields path. 83 If recursive is true, walks subdirectories recursively.""" 84 for path in paths: 85 if not os.path.isdir(path): 86 yield path 87 continue 88 89 if recursive: 90 for root, _, filenames in os.walk(path): 91 for filename in filenames: 92 yield os.path.join(root, filename) 93 else: 94 for filename in os.listdir(path): 95 yield os.path.join(path, filename) 96 97 files = _FindFilesInCloudStorage(GetFilesInPaths(args.paths, args.recursive)) 98 99 if not files: 100 print 'No files in Cloud Storage.' 101 return 102 103 for file_path, buckets in sorted(files.iteritems()): 104 if buckets: 105 buckets = [BUCKETS[bucket] for bucket in buckets] 106 print '%-11s %s' % (','.join(buckets), file_path) 107 else: 108 print '%-11s %s' % ('not found', file_path) 109 110 111class Mv(command_line.Command): 112 """Move files to the given bucket.""" 113 114 @classmethod 115 def AddCommandLineArgs(cls, parser): 116 parser.add_argument('files', nargs='+') 117 parser.add_argument('bucket', choices=cloud_storage.BUCKET_ALIASES) 118 119 @classmethod 120 def ProcessCommandLineArgs(cls, parser, args): 121 args.bucket = cloud_storage.BUCKET_ALIASES[args.bucket] 122 123 def Run(self, args): 124 files = _FindFilesInCloudStorage(args.files) 125 126 for file_path, buckets in sorted(files.iteritems()): 127 if not buckets: 128 raise IOError('%s not found in Cloud Storage.' % file_path) 129 130 for file_path, buckets in sorted(files.iteritems()): 131 if args.bucket in buckets: 132 buckets.remove(args.bucket) 133 if not buckets: 134 logging.info('Skipping %s, no action needed.' % file_path) 135 continue 136 137 # Move to the target bucket. 138 file_hash = cloud_storage.ReadHash(file_path + '.sha1') 139 cloud_storage.Move(buckets.pop(), args.bucket, file_hash) 140 141 # Delete all additional copies. 142 for bucket in buckets: 143 cloud_storage.Delete(bucket, file_hash) 144 145 146class Rm(command_line.Command): 147 """Remove files from Cloud Storage.""" 148 149 @classmethod 150 def AddCommandLineArgs(cls, parser): 151 parser.add_argument('files', nargs='+') 152 153 def Run(self, args): 154 files = _FindFilesInCloudStorage(args.files) 155 for file_path, buckets in sorted(files.iteritems()): 156 file_hash = cloud_storage.ReadHash(file_path + '.sha1') 157 for bucket in buckets: 158 cloud_storage.Delete(bucket, file_hash) 159 160 161class Upload(command_line.Command): 162 """Upload files to Cloud Storage.""" 163 164 @classmethod 165 def AddCommandLineArgs(cls, parser): 166 parser.add_argument('files', nargs='+') 167 parser.add_argument('bucket', choices=cloud_storage.BUCKET_ALIASES) 168 169 @classmethod 170 def ProcessCommandLineArgs(cls, parser, args): 171 args.bucket = cloud_storage.BUCKET_ALIASES[args.bucket] 172 173 for path in args.files: 174 if not os.path.exists(path): 175 parser.error('File not found: %s' % path) 176 177 def Run(self, args): 178 for file_path in args.files: 179 file_hash = cloud_storage.CalculateHash(file_path) 180 181 # Create or update the hash file. 182 hash_path = file_path + '.sha1' 183 with open(hash_path, 'wb') as f: 184 f.write(file_hash) 185 f.flush() 186 187 # Add the data to Cloud Storage. 188 cloud_storage.Insert(args.bucket, file_hash, file_path) 189 190 # Add the hash file to the branch, for convenience. :) 191 subprocess.call(['git', 'add', hash_path]) 192 193 194class CloudStorageCommand(command_line.SubcommandCommand): 195 commands = (Ls, Mv, Rm, Upload) 196 197 198if __name__ == '__main__': 199 logging.getLogger().setLevel(logging.INFO) 200 sys.exit(CloudStorageCommand.main()) 201