Context Navigation

← Previous Changeset
Next Changeset →

Changeset 257134 in webkit

Timestamp:

Feb 21, 2020, 8:20:55 AM (5 years ago)

Author:

mark.lam@apple.com

Message:

Make support for bytecode caching more robust against file corruption.
https://bugs.webkit.org/show_bug.cgi?id=207972
<rdar://problem/59260595>

Reviewed by Yusuke Suzuki.

If a bytecode cache file is corrupted, we currently will always crash every time
we try to read it (in perpetuity as long as the corrupted cache file continues to
exist on disk). To guard against this, we'll harden the bytecode caching mechanism
as follows:

Modify the writeCache operation to always write the cache file in a transactional manner, i.e. we'll first write to a .tmp file, and then rename the .tmp file to the cache file only once the entire file has been written completely.

This ensures that we won't get corrupted cache files due to interrupted writes.

Modify the writeCache operation to also compute a SHA1 hash of the cache file and append the hash at the end of the file. Modify the readCache operation to first authenticate the SHA1 hash before allowing the cache file to be used. If the hash does not match, the file is bad, and we'll just delete it.

This ensures that we won't be crashing while decoding a corrupted cache file.

Manually tested with the following scenarios and ensuring that the client recovers
with no crashes:

no cache file on disk.
a 0-sized cache file on disk.
a truncated cache file on disk.
a corrupted cache file on disk.
an uncorrupted cache file on disk.

Also added some static_asserts in CachedTypes.cpp to document some invariants that
the pre-existing code is dependent on.

API/JSScript.mm:

(-[JSScript readCache]):
(-[JSScript writeCache:]):

runtime/CachedTypes.cpp:

Location:

trunk/Source/JavaScriptCore

Files:

3 edited

API/JSScript.mm (modified) (8 diffs)
ChangeLog (modified) (1 diff)
runtime/CachedTypes.cpp (modified) (3 diffs)

Legend:

Unmodified
Added
Removed

trunk/Source/JavaScriptCore/API/JSScript.mm

-              r254152
+              r257134
 /*
  * Copyright (C) 2019 Apple Inc. All rights reserved.
+ * Copyright (C) 2019-2020 Apple Inc. All rights reserved.
+ *
  * Redistribution and use in source and binary forms, with or without
 …
 #import <wtf/FileMetadata.h>
 #import <wtf/FileSystem.h>
+#import <wtf/SHA1.h>
 #import <wtf/Scope.h>
 #import <wtf/WeakObjCPtr.h>
 …
         return;
+    auto fd = FileSystem::openAndLockFile([m_cachePath path].UTF8String, FileSystem::FileOpenMode::Read, {FileSystem::FileLockMode::Exclusive, FileSystem::FileLockMode::Nonblocking});
+    NSString *cachePathString = [m_cachePath path];
+    const char* cacheFilename = cachePathString.UTF8String;
+    auto fd = FileSystem::openAndLockFile(cacheFilename, FileSystem::FileOpenMode::Read, {FileSystem::FileLockMode::Exclusive, FileSystem::FileLockMode::Nonblocking});
     if (!FileSystem::isHandleValid(fd))
         return;
 …
     if (!success)
         return;
+    const uint8_t* fileData = reinterpret_cast<const uint8_t*>(mappedFile.data());
+    unsigned fileTotalSize = mappedFile.size();
+    // Ensure we at least have a SHA1::Digest to read.
+    if (fileTotalSize < sizeof(SHA1::Digest)) {
+        FileSystem::deleteFile(cacheFilename);
+        return;
+    }
+    unsigned fileDataSize = fileTotalSize - sizeof(SHA1::Digest);
+    SHA1::Digest computedHash;
+    SHA1 sha1;
+    sha1.addBytes(fileData, fileDataSize);
+    sha1.computeHash(computedHash);
+    SHA1::Digest fileHash;
+    memcpy(&fileHash, fileData + fileDataSize, sizeof(SHA1::Digest));
+    if (computedHash != fileHash) {
+        FileSystem::deleteFile(cacheFilename);
+        return;
+    }
     Ref<JSC::CachedBytecode> cachedBytecode = JSC::CachedBytecode::create(WTFMove(mappedFile));
 …
         m_cachedBytecode = WTFMove(cachedBytecode);
     else
         ftruncate(fd, 0);
+        FileSystem::truncateFile(fd, 0);
+}
 …
+    }
+    int fd = open([m_cachePath path].UTF8String, O_CREAT | O_RDWR | O_EXLOCK | O_NONBLOCK, 0666);
+    // We want to do the write as a transaction (i.e. we guarantee that it's all
+    // or nothing). So, we'll write to a temp file first, and rename the temp
+    // file to the cache file only after we've finished writing the whole thing.
+    NSString *cachePathString = [m_cachePath path];
+    const char* cacheFileName = cachePathString.UTF8String;
+    const char* tempFileName = [cachePathString stringByAppendingString:@".tmp"].UTF8String;
+    int fd = open(cacheFileName, O_CREAT | O_WRONLY | O_EXLOCK | O_NONBLOCK, 0600);
     if (fd == -1) {
         error = makeString("Could not open or lock the bytecode cache file. It's likely another VM or process is already using it. Error: ", strerror(errno));
         return NO;
+    }
     auto closeFD = makeScopeExit([&] {
         close(fd);
+    });
+    int tempFD = open(tempFileName, O_CREAT | O_RDWR | O_EXLOCK | O_NONBLOCK, 0600);
+    if (tempFD == -1) {
+        error = makeString("Could not open or lock the bytecode cache temp file. Error: ", strerror(errno));
+        return NO;
+    }
+    auto closeTempFD = makeScopeExit([&] {
+        close(tempFD);
     });
 …
     switch (m_type) {
     case kJSScriptTypeModule:
         m_cachedBytecode = JSC::generateModuleBytecode(vm, sourceCode, fd, cacheError);
+        m_cachedBytecode = JSC::generateModuleBytecode(vm, sourceCode, tempFD, cacheError);
         break;
     case kJSScriptTypeProgram:
         m_cachedBytecode = JSC::generateProgramBytecode(vm, sourceCode, fd, cacheError);
+        m_cachedBytecode = JSC::generateProgramBytecode(vm, sourceCode, tempFD, cacheError);
         break;
+    }
 …
+    }
+    SHA1::Digest computedHash;
+    SHA1 sha1;
+    sha1.addBytes(m_cachedBytecode->data(), m_cachedBytecode->size());
+    sha1.computeHash(computedHash);
+    FileSystem::writeToFile(tempFD, reinterpret_cast<const char*>(&computedHash), sizeof(computedHash));
+    fsync(tempFD);
+    rename(tempFileName, cacheFileName);
     return YES;
+}

trunk/Source/JavaScriptCore/ChangeLog

-              r257034
+              r257134
+2020-02-20  Mark Lam  <mark.lam@apple.com>
+        Make support for bytecode caching more robust against file corruption.
+        https://bugs.webkit.org/show_bug.cgi?id=207972
+        <rdar://problem/59260595>
+        Reviewed by Yusuke Suzuki.
+        If a bytecode cache file is corrupted, we currently will always crash every time
+        we try to read it (in perpetuity as long as the corrupted cache file continues to
+        exist on disk).  To guard against this, we'll harden the bytecode caching mechanism
+        as follows:
+        1. Modify the writeCache operation to always write the cache file in a transactional
+           manner i.e. we'll first write to a .tmp file, and then rename the .tmp file to
+           the cache file only if the entire file has been written in completeness.
+           This ensures that we won't get corrupted cache files due to interrupted writes.
+        2. Modify the writeCache operation to also compute a SHA1 hash of the cache file
+           and append the hash at the end of the file.  Modify the readCache operation to
+           first authenticate the SHA1 hash before allowing the cache file to be used.
+           If the hash does not match, the file is bad, and we'll just delete it.
+           This ensures that we won't be crashing while decoding a corrupted cache file.
+        Manually tested with the following scenarios and ensuring that the client recovers
+        with no crashes:
+        1. no cache file on disk.
+        2. a 0-sized cache file on disk.
+        3. a truncated cache file on disk.
+        4. a corrupted cache file on disk.
+        5. an uncorrupted cache file on disk.
+        Also added some static_asserts in CachedTypes.cpp to document some invariants that
+        the pre-existing code is dependent on.
+        * API/JSScript.mm:
+        (-[JSScript readCache]):
+        (-[JSScript writeCache:]):
+        * runtime/CachedTypes.cpp:
 2020-02-19  Ross Kirsling  <ross.kirsling@sony.com>

trunk/Source/JavaScriptCore/runtime/CachedTypes.cpp

-              r255703
+              r257134
 /*
  * Copyright (C) 2019 Apple Inc. All rights reserved.
+ * Copyright (C) 2019-2020 Apple Inc. All rights reserved.
+ *
  * Redistribution and use in source and binary forms, with or without
 …
 };
+static_assert(alignof(GenericCacheEntry) <= alignof(std::max_align_t));
 template<typename UnlinkedCodeBlockType>
 class CacheEntry : public GenericCacheEntry {
 …
     CachedPtr<CachedCodeBlockType<UnlinkedCodeBlockType>> m_codeBlock;
 };
+static_assert(alignof(CacheEntry<UnlinkedProgramCodeBlock>) <= alignof(std::max_align_t));
+static_assert(alignof(CacheEntry<UnlinkedModuleProgramCodeBlock>) <= alignof(std::max_align_t));
 bool GenericCacheEntry::decode(Decoder& decoder, std::pair<SourceCodeKey, UnlinkedCodeBlock*>& result) const

Note: See TracChangeset for help on using the changeset viewer.