-
Notifications
You must be signed in to change notification settings - Fork 2.8k
/
S3Objects.java
208 lines (177 loc) · 6.11 KB
/
S3Objects.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
/*
* Copyright 2012-2024 Amazon.com, Inc. or its affiliates. All Rights Reserved.
*
* Licensed under the Apache License, Version 2.0 (the "License").
* You may not use this file except in compliance with the License.
* A copy of the License is located at
*
* http://aws.amazon.com/apache2.0
*
* or in the "license" file accompanying this file. This file is distributed
* on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
* express or implied. See the License for the specific language governing
* permissions and limitations under the License.
*/
package com.amazonaws.services.s3.iterable;
import com.amazonaws.services.s3.AmazonS3;
import com.amazonaws.services.s3.model.ListObjectsRequest;
import com.amazonaws.services.s3.model.ObjectListing;
import com.amazonaws.services.s3.model.S3ObjectSummary;
import java.util.Iterator;
/**
 * Provides an easy way to iterate Amazon S3 objects in a "foreach" statement.
 * For example:
 *
 * <pre class="brush: java">
 * for ( S3ObjectSummary summary : S3Objects.withPrefix(s3, "my-bucket", "photos/") ) {
 *     System.out.printf("Object with key '%s'\n", summary.getKey());
 * }
 * </pre>
 * <p>
 * The list of {@link S3ObjectSummary}s will be fetched lazily, a page at a
 * time, as they are needed. The size of the page can be controlled with the
 * {@link S3Objects#withBatchSize(int)} method.
 * <p>
 * All {@code with*} configuration methods return this instance so they can be
 * chained directly inside the "foreach" header. Every call to
 * {@link #iterator()} starts a fresh listing using the configuration in effect
 * when its pages are requested.
 */
public class S3Objects implements Iterable<S3ObjectSummary> {

    private final AmazonS3 s3;
    private final String bucketName;
    private String prefix = null;
    private Integer batchSize = null;
    private String delimiter;
    private String marker;
    private String encodingType;
    private boolean requesterPays;

    private S3Objects(AmazonS3 s3, String bucketName) {
        this.s3 = s3;
        this.bucketName = bucketName;
    }

    /**
     * Constructs an iterable that covers all the objects in an Amazon S3
     * bucket.
     *
     * @param s3
     *            The Amazon S3 client.
     * @param bucketName
     *            The bucket name.
     * @return An iterable over the object summaries.
     */
    public static S3Objects inBucket(AmazonS3 s3, String bucketName) {
        return new S3Objects(s3, bucketName);
    }

    /**
     * Constructs an iterable that covers the objects in an Amazon S3 bucket
     * where the key begins with the given prefix.
     *
     * @param s3
     *            The Amazon S3 client.
     * @param bucketName
     *            The bucket name.
     * @param prefix
     *            The prefix.
     * @return An iterable over the object summaries.
     */
    public static S3Objects withPrefix(AmazonS3 s3, String bucketName, String prefix) {
        S3Objects objects = new S3Objects(s3, bucketName);
        objects.prefix = prefix;
        return objects;
    }

    /**
     * Sets the batch size, i.e., how many {@link S3ObjectSummary}s will be
     * fetched at once.
     *
     * @param batchSize
     *            How many object summaries to fetch at once.
     * @return This object, for method chaining.
     */
    public S3Objects withBatchSize(int batchSize) {
        this.batchSize = batchSize;
        return this;
    }

    /**
     * Sets the requester-pays flag that is applied to every page request.
     *
     * @param requesterPays
     *            The flag value passed to each list request.
     * @return This object, for method chaining.
     * @see ListObjectsRequest#withRequesterPays(boolean)
     */
    public S3Objects withRequesterPays(boolean requesterPays) {
        this.requesterPays = requesterPays;
        return this;
    }

    /**
     * Sets the encoding type that is applied to every page request.
     *
     * @param encodingType
     *            The encoding type passed to each list request.
     * @return This object, for method chaining.
     * @see ListObjectsRequest#withEncodingType(String)
     */
    public S3Objects withEncodingType(String encodingType) {
        this.encodingType = encodingType;
        return this;
    }

    /**
     * Sets the marker used for the first page request.
     *
     * @param marker
     *            The marker passed to the first list request.
     * @return This object, for method chaining.
     * @see ListObjectsRequest#withMarker(String)
     */
    public S3Objects withMarker(String marker) {
        this.marker = marker;
        return this;
    }

    /**
     * Sets the delimiter that is applied to every page request.
     *
     * @param delimiter
     *            The delimiter passed to each list request.
     * @return This object, for method chaining.
     * @see ListObjectsRequest#withDelimiter(String)
     */
    public S3Objects withDelimiter(String delimiter) {
        this.delimiter = delimiter;
        return this;
    }

    /** @return The configured batch size, or {@code null} if none was set. */
    public Integer getBatchSize() {
        return batchSize;
    }

    /** @return The configured key prefix, or {@code null} if none was set. */
    public String getPrefix() {
        return prefix;
    }

    /** @return The name of the bucket being listed. */
    public String getBucketName() {
        return bucketName;
    }

    /** @return The configured delimiter, or {@code null} if none was set. */
    public String getDelimiter() {
        return delimiter;
    }

    /** @return The configured starting marker, or {@code null} if none was set. */
    public String getMarker() {
        return marker;
    }

    /** @return The configured encoding type, or {@code null} if none was set. */
    public String getEncodingType() {
        return encodingType;
    }

    /** @return Whether the requester-pays flag is sent with list requests. */
    public boolean isRequesterPays() {
        return requesterPays;
    }

    /** @return The Amazon S3 client used to issue list requests. */
    public AmazonS3 getS3() {
        return s3;
    }

    /**
     * Iterator that walks the object summaries one page at a time, requesting
     * the next page only once the current one has been consumed.
     */
    private class S3ObjectIterator implements Iterator<S3ObjectSummary> {

        private ObjectListing currentListing = null;
        private Iterator<S3ObjectSummary> currentIterator = null;

        @Override
        public boolean hasNext() {
            prepareCurrentListing();
            return currentIterator.hasNext();
        }

        @Override
        public S3ObjectSummary next() {
            prepareCurrentListing();
            // Delegates to the page iterator, including its behavior when exhausted.
            return currentIterator.next();
        }

        @Override
        public void remove() {
            throw new UnsupportedOperationException();
        }

        /**
         * Ensures {@code currentIterator} points at a page that either has
         * elements left or is the final page. Loops because a truncated page
         * may contain no object summaries.
         */
        private void prepareCurrentListing() {
            while (currentListing == null || (!currentIterator.hasNext() && currentListing.isTruncated())) {
                // The first page starts at the configured marker; later pages
                // continue from where the previous listing stopped.
                String startMarker = (currentListing == null) ? getMarker() : currentListing.getNextMarker();
                currentListing = getS3().listObjects(newRequest(startMarker));
                currentIterator = currentListing.getObjectSummaries().iterator();
            }
        }

        /**
         * Builds a list request carrying the full configuration of the
         * enclosing {@link S3Objects}. Every page is requested this way, rather
         * than through {@code listNextBatchOfObjects(ObjectListing)}, because
         * that call only receives the previous listing and so cannot carry the
         * requester-pays flag to follow-up pages.
         *
         * @param startMarker
         *            The marker at which this page starts; may be {@code null}.
         * @return A fully configured request for one page.
         */
        private ListObjectsRequest newRequest(String startMarker) {
            ListObjectsRequest req = new ListObjectsRequest();
            req.setBucketName(getBucketName());
            req.setPrefix(getPrefix());
            req.setMaxKeys(getBatchSize());
            req.setDelimiter(getDelimiter());
            req.setMarker(startMarker);
            req.setEncodingType(getEncodingType());
            req.setRequesterPays(isRequesterPays());
            return req;
        }
    }

    /**
     * Returns a new iterator that lists the objects from the beginning, using
     * this object's configuration.
     *
     * @return A lazily paging iterator over the object summaries.
     */
    @Override
    public Iterator<S3ObjectSummary> iterator() {
        return new S3ObjectIterator();
    }
}