Skip to content

Commit 321a6cc

Browse files
authored
HADOOP-19072. S3A: expand optimisations on stores with "fs.s3a.performance.flags" for mkdir (apache#6543)
If the flag list in fs.s3a.performance.flags includes "mkdir" then the safety check of a walk up the tree to look for a parent directory, -done to verify a directory isn't being created under a file- are skipped. This saves the cost of multiple list operations. Contributed by Viraj Jasani
1 parent 2a50911 commit 321a6cc

File tree

10 files changed

+265
-34
lines changed

10 files changed

+265
-34
lines changed

hadoop-common-project/hadoop-common/src/site/markdown/filesystem/fsdataoutputstreambuilder.md

+2-2
Original file line numberDiff line numberDiff line change
@@ -200,8 +200,8 @@ Prioritize file creation performance over safety checks for filesystem consisten
200200
This:
201201
1. Skips the `LIST` call which makes sure a file is being created over a directory.
202202
Risk: a file is created over a directory.
203-
1. Ignores the overwrite flag.
204-
1. Never issues a `DELETE` call to delete parent directory markers.
203+
2. Ignores the overwrite flag.
204+
3. Never issues a `DELETE` call to delete parent directory markers.
205205

206206
It is possible to probe an S3A Filesystem instance for this capability through
207207
the `hasPathCapability(path, "fs.s3a.create.performance")` check.

hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/fs/FileContextCreateMkdirBaseTest.java

+12-9
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,7 @@
2727
import static org.apache.hadoop.fs.FileContextTestHelper.*;
2828
import static org.apache.hadoop.fs.contract.ContractTestUtils.assertIsDirectory;
2929
import static org.apache.hadoop.fs.contract.ContractTestUtils.assertIsFile;
30+
import static org.apache.hadoop.test.LambdaTestUtils.intercept;
3031

3132
import org.apache.hadoop.test.GenericTestUtils;
3233
import org.slf4j.event.Level;
@@ -55,7 +56,10 @@ public abstract class FileContextCreateMkdirBaseTest {
5556

5657
protected final FileContextTestHelper fileContextTestHelper;
5758
protected static FileContext fc;
58-
59+
60+
public static final String MKDIR_FILE_PRESENT_ERROR =
61+
" should have failed as a file was present";
62+
5963
static {
6064
GenericTestUtils.setLogLevel(FileSystem.LOG, Level.DEBUG);
6165
}
@@ -128,7 +132,7 @@ public void testMkdirsRecursiveWithExistingDir() throws IOException {
128132
}
129133

130134
@Test
131-
public void testMkdirRecursiveWithExistingFile() throws IOException {
135+
public void testMkdirRecursiveWithExistingFile() throws Exception {
132136
Path f = getTestRootPath(fc, "NonExistant3/aDir");
133137
fc.mkdir(f, FileContext.DEFAULT_PERM, true);
134138
assertIsDirectory(fc.getFileStatus(f));
@@ -141,13 +145,12 @@ public void testMkdirRecursiveWithExistingFile() throws IOException {
141145

142146
// try creating another folder which conflicts with filePath
143147
Path dirPath = new Path(filePath, "bDir/cDir");
144-
try {
145-
fc.mkdir(dirPath, FileContext.DEFAULT_PERM, true);
146-
Assert.fail("Mkdir for " + dirPath
147-
+ " should have failed as a file was present");
148-
} catch(IOException e) {
149-
// failed as expected
150-
}
148+
intercept(
149+
IOException.class,
150+
null,
151+
"Mkdir for " + dirPath + MKDIR_FILE_PRESENT_ERROR,
152+
() -> fc.mkdir(dirPath, FileContext.DEFAULT_PERM, true)
153+
);
151154
}
152155

153156
@Test

hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/fs/contract/AbstractContractMkdirTest.java

+5-2
Original file line numberDiff line numberDiff line change
@@ -35,6 +35,9 @@
3535
*/
3636
public abstract class AbstractContractMkdirTest extends AbstractFSContractTestBase {
3737

38+
public static final String MKDIRS_NOT_FAILED_OVER_FILE =
39+
"mkdirs did not fail over a file but returned ";
40+
3841
@Test
3942
public void testMkDirRmDir() throws Throwable {
4043
FileSystem fs = getFileSystem();
@@ -66,7 +69,7 @@ public void testNoMkdirOverFile() throws Throwable {
6669
createFile(getFileSystem(), path, false, dataset);
6770
try {
6871
boolean made = fs.mkdirs(path);
69-
fail("mkdirs did not fail over a file but returned " + made
72+
fail(MKDIRS_NOT_FAILED_OVER_FILE + made
7073
+ "; " + ls(path));
7174
} catch (ParentNotDirectoryException | FileAlreadyExistsException e) {
7275
//parent is a directory
@@ -93,7 +96,7 @@ public void testMkdirOverParentFile() throws Throwable {
9396
Path child = new Path(path,"child-to-mkdir");
9497
try {
9598
boolean made = fs.mkdirs(child);
96-
fail("mkdirs did not fail over a file but returned " + made
99+
fail(MKDIRS_NOT_FAILED_OVER_FILE + made
97100
+ "; " + ls(path));
98101
} catch (ParentNotDirectoryException | FileAlreadyExistsException e) {
99102
//parent is a directory

hadoop-tools/hadoop-aws/src/main/java/org/apache/hadoop/fs/s3a/S3AFileSystem.java

+5-2
Original file line numberDiff line numberDiff line change
@@ -3828,7 +3828,8 @@ public boolean mkdirs(Path p, FsPermission permission) throws IOException,
38283828
createStoreContext(),
38293829
path,
38303830
createMkdirOperationCallbacks(),
3831-
isMagicCommitPath(path)));
3831+
isMagicCommitPath(path),
3832+
performanceFlags.enabled(PerformanceFlagEnum.Mkdir)));
38323833
}
38333834

38343835
/**
@@ -4281,7 +4282,9 @@ public boolean createEmptyDir(Path path, StoreContext storeContext)
42814282
new MkdirOperation(
42824283
storeContext,
42834284
path,
4284-
createMkdirOperationCallbacks(), false));
4285+
createMkdirOperationCallbacks(),
4286+
false,
4287+
performanceFlags.enabled(PerformanceFlagEnum.Mkdir)));
42854288
}
42864289
}
42874290

hadoop-tools/hadoop-aws/src/main/java/org/apache/hadoop/fs/s3a/impl/MkdirOperation.java

+61-16
Original file line numberDiff line numberDiff line change
@@ -26,6 +26,8 @@
2626
import org.slf4j.Logger;
2727
import org.slf4j.LoggerFactory;
2828

29+
import org.apache.hadoop.classification.InterfaceAudience;
30+
import org.apache.hadoop.classification.InterfaceStability;
2931
import org.apache.hadoop.fs.FileAlreadyExistsException;
3032
import org.apache.hadoop.fs.FileStatus;
3133
import org.apache.hadoop.fs.Path;
@@ -54,30 +56,54 @@
5456
* <li>If needed, one PUT</li>
5557
* </ol>
5658
*/
59+
@InterfaceAudience.Private
60+
@InterfaceStability.Evolving
5761
public class MkdirOperation extends ExecutingStoreOperation<Boolean> {
5862

5963
private static final Logger LOG = LoggerFactory.getLogger(
6064
MkdirOperation.class);
6165

66+
/**
67+
* Path of the directory to be created.
68+
*/
6269
private final Path dir;
6370

71+
/**
72+
* Mkdir Callbacks object to be used by the Mkdir operation.
73+
*/
6474
private final MkdirCallbacks callbacks;
6575

6676
/**
67-
* Should checks for ancestors existing be skipped?
68-
* This flag is set when working with magic directories.
77+
* Whether to skip the validation of the parent directory.
78+
*/
79+
private final boolean performanceMkdir;
80+
81+
/**
82+
* Whether the path is magic commit path.
6983
*/
7084
private final boolean isMagicPath;
7185

86+
/**
87+
* Initialize Mkdir Operation context for S3A.
88+
*
89+
* @param storeContext Store context.
90+
* @param dir Dir path of the directory.
91+
* @param callbacks MkdirCallbacks object used by the Mkdir operation.
92+
* @param isMagicPath True if the path is magic commit path.
93+
* @param performanceMkdir If true, skip validation of the parent directory
94+
* structure.
95+
*/
7296
public MkdirOperation(
7397
final StoreContext storeContext,
7498
final Path dir,
7599
final MkdirCallbacks callbacks,
76-
final boolean isMagicPath) {
100+
final boolean isMagicPath,
101+
final boolean performanceMkdir) {
77102
super(storeContext);
78103
this.dir = dir;
79104
this.callbacks = callbacks;
80105
this.isMagicPath = isMagicPath;
106+
this.performanceMkdir = performanceMkdir;
81107
}
82108

83109
/**
@@ -124,7 +150,32 @@ public Boolean execute() throws IOException {
124150
return true;
125151
}
126152

127-
// Walk path to root, ensuring closest ancestor is a directory, not file
153+
// if performance creation mode is set, no need to check
154+
// whether the closest ancestor is dir.
155+
if (!performanceMkdir) {
156+
verifyFileStatusOfClosestAncestor();
157+
}
158+
159+
// if we get here there is no directory at the destination.
160+
// so create one.
161+
162+
// Create the marker file, delete the parent entries
163+
// if the filesystem isn't configured to retain them
164+
callbacks.createFakeDirectory(dir, false);
165+
return true;
166+
}
167+
168+
/**
169+
* Verify the file status of the closest ancestor, if it is
170+
* dir, the mkdir operation should proceed. If it is file,
171+
* the mkdir operation should throw error.
172+
*
173+
* @throws IOException If either file status could not be retrieved,
174+
* or if the closest ancestor is a file.
175+
*/
176+
private void verifyFileStatusOfClosestAncestor() throws IOException {
177+
FileStatus fileStatus;
178+
// Walk path to root, ensuring the closest ancestor is a directory, not file
128179
Path fPart = dir.getParent();
129180
try {
130181
while (fPart != null && !fPart.isRoot()) {
@@ -140,24 +191,18 @@ public Boolean execute() throws IOException {
140191
}
141192

142193
// there's a file at the parent entry
143-
throw new FileAlreadyExistsException(String.format(
144-
"Can't make directory for path '%s' since it is a file.",
145-
fPart));
194+
throw new FileAlreadyExistsException(
195+
String.format(
196+
"Can't make directory for path '%s' since it is a file.",
197+
fPart));
146198
}
147199
} catch (AccessDeniedException e) {
148200
LOG.info("mkdirs({}}: Access denied when looking"
149201
+ " for parent directory {}; skipping checks",
150-
dir, fPart);
202+
dir,
203+
fPart);
151204
LOG.debug("{}", e, e);
152205
}
153-
154-
// if we get here there is no directory at the destination.
155-
// so create one.
156-
157-
// Create the marker file, delete the parent entries
158-
// if the filesystem isn't configured to retain them
159-
callbacks.createFakeDirectory(dir, false);
160-
return true;
161206
}
162207

163208
/**

hadoop-tools/hadoop-aws/src/site/markdown/tools/hadoop-aws/performance.md

+20-1
Original file line numberDiff line numberDiff line change
@@ -299,8 +299,11 @@ understands the risks.
299299
| *Option* | *Meaning* | Since |
300300
|----------|--------------------|:------|
301301
| `create` | Create Performance | 3.4.1 |
302+
| `mkdir` | Mkdir Performance | 3.4.1 |
302303

303-
The `create` flag has the same semantics as [`fs.s3a.create.performance`](#create-performance)
304+
305+
* The `create` flag has the same semantics as [`fs.s3a.create.performance`](#create-performance)
306+
* The `mkdir` flag semantics are explained in [Mkdir Performance](#mkdir-performance)
304307

305308

306309
### <a name="create-performance"></a> Create Performance `fs.s3a.create.performance`
@@ -321,6 +324,22 @@ It may however result in
321324

322325
Use with care, and, ideally, enable versioning on the S3 store.
323326

327+
328+
### <a name="mkdir-performance"></a> Mkdir Performance
329+
330+
`fs.s3a.performance.flag` flag option `mkdir`:
331+
332+
* Mkdir does not check whether the parent is directory or file.
333+
334+
This avoids the verification of the file status of the parent file
335+
or the closest ancestor. Unlike the default mkdir operation, if the
336+
parent is not a directory, the mkdir operation does not throw any
337+
error.
338+
339+
This option can help with mkdir performance improvement but must be used
340+
only if the person setting them understands the above-mentioned risk.
341+
342+
324343
### <a name="threads"></a> Thread and connection pool settings.
325344

326345
Each S3A client interacting with a single bucket, as a single user, has its

hadoop-tools/hadoop-aws/src/test/java/org/apache/hadoop/fs/contract/s3a/ITestS3AContractMkdir.java

+11
Original file line numberDiff line numberDiff line change
@@ -22,11 +22,22 @@
2222
import org.apache.hadoop.fs.contract.AbstractContractMkdirTest;
2323
import org.apache.hadoop.fs.contract.AbstractFSContract;
2424

25+
import static org.apache.hadoop.fs.s3a.Constants.FS_S3A_CREATE_PERFORMANCE;
26+
import static org.apache.hadoop.fs.s3a.S3ATestUtils.removeBaseAndBucketOverrides;
27+
2528
/**
2629
* Test dir operations on S3A.
2730
*/
2831
public class ITestS3AContractMkdir extends AbstractContractMkdirTest {
2932

33+
@Override
34+
protected Configuration createConfiguration() {
35+
Configuration conf = super.createConfiguration();
36+
removeBaseAndBucketOverrides(conf,
37+
FS_S3A_CREATE_PERFORMANCE);
38+
return conf;
39+
}
40+
3041
@Override
3142
protected AbstractFSContract createContract(Configuration conf) {
3243
return new S3AContract(conf);
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,75 @@
1+
/*
2+
* Licensed to the Apache Software Foundation (ASF) under one
3+
* or more contributor license agreements. See the NOTICE file
4+
* distributed with this work for additional information
5+
* regarding copyright ownership. The ASF licenses this file
6+
* to you under the Apache License, Version 2.0 (the
7+
* "License"); you may not use this file except in compliance
8+
* with the License. You may obtain a copy of the License at
9+
*
10+
* http://www.apache.org/licenses/LICENSE-2.0
11+
*
12+
* Unless required by applicable law or agreed to in writing, software
13+
* distributed under the License is distributed on an "AS IS" BASIS,
14+
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15+
* See the License for the specific language governing permissions and
16+
* limitations under the License.
17+
*/
18+
19+
package org.apache.hadoop.fs.contract.s3a;
20+
21+
import org.junit.Test;
22+
23+
import org.apache.hadoop.conf.Configuration;
24+
import org.apache.hadoop.fs.FileSystem;
25+
import org.apache.hadoop.fs.Path;
26+
import org.apache.hadoop.fs.contract.AbstractContractMkdirTest;
27+
import org.apache.hadoop.fs.contract.AbstractFSContract;
28+
import org.apache.hadoop.fs.contract.ContractTestUtils;
29+
30+
import static org.apache.hadoop.fs.contract.ContractTestUtils.createFile;
31+
import static org.apache.hadoop.fs.contract.ContractTestUtils.dataset;
32+
import static org.apache.hadoop.fs.s3a.Constants.FS_S3A_CREATE_PERFORMANCE;
33+
import static org.apache.hadoop.fs.s3a.Constants.FS_S3A_PERFORMANCE_FLAGS;
34+
import static org.apache.hadoop.fs.s3a.S3ATestUtils.removeBaseAndBucketOverrides;
35+
36+
/**
37+
* Test mkdir operations on S3A with create performance mode.
38+
*/
39+
public class ITestS3AContractMkdirWithCreatePerf extends AbstractContractMkdirTest {
40+
41+
@Override
42+
protected Configuration createConfiguration() {
43+
Configuration conf = super.createConfiguration();
44+
removeBaseAndBucketOverrides(
45+
conf,
46+
FS_S3A_CREATE_PERFORMANCE,
47+
FS_S3A_PERFORMANCE_FLAGS);
48+
conf.setStrings(FS_S3A_PERFORMANCE_FLAGS,
49+
"create,mkdir");
50+
return conf;
51+
}
52+
53+
@Override
54+
protected AbstractFSContract createContract(Configuration conf) {
55+
return new S3AContract(conf);
56+
}
57+
58+
@Test
59+
public void testMkdirOverParentFile() throws Throwable {
60+
describe("try to mkdir where a parent is a file, should pass");
61+
FileSystem fs = getFileSystem();
62+
Path path = methodPath();
63+
byte[] dataset = dataset(1024, ' ', 'z');
64+
createFile(getFileSystem(), path, false, dataset);
65+
Path child = new Path(path, "child-to-mkdir");
66+
boolean childCreated = fs.mkdirs(child);
67+
assertTrue("Child dir is created", childCreated);
68+
assertIsFile(path);
69+
byte[] bytes = ContractTestUtils.readDataset(getFileSystem(), path, dataset.length);
70+
ContractTestUtils.compareByteArrays(dataset, bytes, dataset.length);
71+
assertPathExists("mkdir failed", child);
72+
assertDeleted(child, true);
73+
}
74+
75+
}

0 commit comments

Comments
 (0)