2016-05-04 18:16:48 +03:00
|
|
|
|
#include "config.h"
|
|
|
|
|
|
|
|
|
|
#if ENABLE_S3
|
2016-12-08 16:35:46 +02:00
|
|
|
|
#if __linux__
|
2016-05-04 18:16:48 +03:00
|
|
|
|
|
2016-04-21 17:02:48 +03:00
|
|
|
|
#include "s3-binary-cache-store.hh"
|
|
|
|
|
#include "nar-info.hh"
|
|
|
|
|
#include "nar-info-disk-cache.hh"
|
|
|
|
|
#include "globals.hh"
|
|
|
|
|
|
2016-12-22 18:39:05 +02:00
|
|
|
|
#include <aws/core/Aws.h>
|
2016-04-21 17:02:48 +03:00
|
|
|
|
#include <aws/core/client/ClientConfiguration.h>
|
|
|
|
|
#include <aws/s3/S3Client.h>
|
|
|
|
|
#include <aws/s3/model/CreateBucketRequest.h>
|
|
|
|
|
#include <aws/s3/model/GetBucketLocationRequest.h>
|
|
|
|
|
#include <aws/s3/model/GetObjectRequest.h>
|
|
|
|
|
#include <aws/s3/model/HeadObjectRequest.h>
|
2016-04-21 18:53:47 +03:00
|
|
|
|
#include <aws/s3/model/ListObjectsRequest.h>
|
2016-12-22 18:39:05 +02:00
|
|
|
|
#include <aws/s3/model/PutObjectRequest.h>
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
|
|
|
|
namespace nix {
|
|
|
|
|
|
2016-12-08 16:31:27 +02:00
|
|
|
|
/* An input stream that reads directly from the bytes of an existing
   std::string instead of copying them into a private buffer.

   The string passed to the constructor must outlive the stream and
   must not be modified while the stream is in use: the stream only
   keeps pointers into it.

   Implementation note: this used to call rdbuf()->pubsetbuf(), but
   the effect of setbuf() on a std::stringbuf is implementation-defined,
   and where it did work it also exposed the (const) string as a
   writable put area. Instead we install a small read-only streambuf
   of our own. The class still derives from std::stringstream so that
   existing users keep compiling; the inherited stringbuf is simply
   left unused, so str() does not return the aliased bytes. */
struct istringstream_nocopy : public std::stringstream
{
    /* Read-only stream buffer whose get area aliases caller-owned
       memory. It has no put area, so any attempt to write through the
       stream fails rather than touching the underlying string. */
    struct Buf : public std::streambuf
    {
        Buf(const char * data, std::size_t size)
        {
            /* setg() wants non-const pointers, but nothing in this
               class ever writes through them. */
            char * begin = const_cast<char *>(data);
            setg(begin, begin, begin + size);
        }

    protected:

        /* Relative/absolute repositioning of the read pointer. Needed
           so that seekg()/tellg() work (e.g. to determine the length
           of the stream). Returns -1 for out-of-range targets or when
           the input sequence is not selected. */
        pos_type seekoff(off_type off, std::ios_base::seekdir dir,
            std::ios_base::openmode which) override
        {
            if (!(which & std::ios_base::in))
                return pos_type(off_type(-1));

            const off_type size = egptr() - eback();

            off_type base;
            if (dir == std::ios_base::beg)
                base = 0;
            else if (dir == std::ios_base::cur)
                base = gptr() - eback();
            else if (dir == std::ios_base::end)
                base = size;
            else
                return pos_type(off_type(-1));

            const off_type target = base + off;
            if (target < 0 || target > size)
                return pos_type(off_type(-1));

            setg(eback(), eback() + target, egptr());
            return pos_type(target);
        }

        pos_type seekpos(pos_type pos, std::ios_base::openmode which) override
        {
            return seekoff(off_type(pos), std::ios_base::beg, which);
        }
    };

    Buf buf;

    istringstream_nocopy(const std::string & s)
        : buf(s.data(), s.size())
    {
        /* Route all I/O on this stream through `buf` rather than the
           stringbuf owned by the std::stringstream base. */
        std::basic_ios<char>::rdbuf(&buf);
    }

    /* The stream holds a pointer to its own `buf` member, so a copied
       or moved object would end up reading from the wrong buffer. */
    istringstream_nocopy(const istringstream_nocopy &) = delete;
    istringstream_nocopy & operator =(const istringstream_nocopy &) = delete;
};
|
|
|
|
|
|
2016-04-21 17:02:48 +03:00
|
|
|
|
struct S3Error : public Error
|
|
|
|
|
{
|
|
|
|
|
Aws::S3::S3Errors err;
|
|
|
|
|
S3Error(Aws::S3::S3Errors err, const FormatOrString & fs)
|
|
|
|
|
: Error(fs), err(err) { };
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
/* Helper: given an Outcome<R, E>, return R in case of success, or
|
|
|
|
|
throw an exception in case of an error. */
|
|
|
|
|
template<typename R, typename E>
|
|
|
|
|
R && checkAws(const FormatOrString & fs, Aws::Utils::Outcome<R, E> && outcome)
|
|
|
|
|
{
|
|
|
|
|
if (!outcome.IsSuccess())
|
|
|
|
|
throw S3Error(
|
|
|
|
|
outcome.GetError().GetErrorType(),
|
|
|
|
|
fs.s + ": " + outcome.GetError().GetMessage());
|
|
|
|
|
return outcome.GetResultWithOwnership();
|
|
|
|
|
}
|
|
|
|
|
|
2016-12-22 18:39:05 +02:00
|
|
|
|
static void initAWS()
|
|
|
|
|
{
|
|
|
|
|
static std::once_flag flag;
|
|
|
|
|
std::call_once(flag, []() {
|
|
|
|
|
Aws::SDKOptions options;
|
|
|
|
|
|
|
|
|
|
/* We install our own OpenSSL locking function (see
|
|
|
|
|
shared.cc), so don't let aws-sdk-cpp override it. */
|
|
|
|
|
options.cryptoOptions.initAndCleanupOpenSSL = false;
|
|
|
|
|
|
|
|
|
|
Aws::InitAPI(options);
|
|
|
|
|
});
|
|
|
|
|
}
|
|
|
|
|
|
2016-04-21 17:02:48 +03:00
|
|
|
|
struct S3BinaryCacheStoreImpl : public S3BinaryCacheStore
|
|
|
|
|
{
|
|
|
|
|
std::string bucketName;
|
|
|
|
|
|
|
|
|
|
ref<Aws::Client::ClientConfiguration> config;
|
|
|
|
|
ref<Aws::S3::S3Client> client;
|
|
|
|
|
|
|
|
|
|
Stats stats;
|
|
|
|
|
|
2016-05-04 21:15:41 +03:00
|
|
|
|
S3BinaryCacheStoreImpl(
|
2016-06-01 15:49:12 +03:00
|
|
|
|
const Params & params, const std::string & bucketName)
|
2016-05-04 21:15:41 +03:00
|
|
|
|
: S3BinaryCacheStore(params)
|
2016-04-21 17:02:48 +03:00
|
|
|
|
, bucketName(bucketName)
|
|
|
|
|
, config(makeConfig())
|
|
|
|
|
, client(make_ref<Aws::S3::S3Client>(*config))
|
|
|
|
|
{
|
|
|
|
|
diskCache = getNarInfoDiskCache();
|
|
|
|
|
}
|
|
|
|
|
|
2016-05-31 14:31:04 +03:00
|
|
|
|
std::string getUri() override
|
2016-04-21 17:02:48 +03:00
|
|
|
|
{
|
|
|
|
|
return "s3://" + bucketName;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
ref<Aws::Client::ClientConfiguration> makeConfig()
|
|
|
|
|
{
|
2016-12-22 18:39:05 +02:00
|
|
|
|
initAWS();
|
2016-04-21 17:02:48 +03:00
|
|
|
|
auto res = make_ref<Aws::Client::ClientConfiguration>();
|
|
|
|
|
res->region = Aws::Region::US_EAST_1; // FIXME: make configurable
|
|
|
|
|
res->requestTimeoutMs = 600 * 1000;
|
|
|
|
|
return res;
|
|
|
|
|
}
|
|
|
|
|
|
2016-05-31 14:31:04 +03:00
|
|
|
|
void init() override
|
2016-04-21 17:02:48 +03:00
|
|
|
|
{
|
2016-06-01 16:15:21 +03:00
|
|
|
|
if (!diskCache->cacheExists(getUri(), wantMassQuery_, priority)) {
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
|
|
|
|
/* Create the bucket if it doesn't already exists. */
|
|
|
|
|
// FIXME: HeadBucket would be more appropriate, but doesn't return
|
|
|
|
|
// an easily parsed 404 message.
|
|
|
|
|
auto res = client->GetBucketLocation(
|
|
|
|
|
Aws::S3::Model::GetBucketLocationRequest().WithBucket(bucketName));
|
|
|
|
|
|
|
|
|
|
if (!res.IsSuccess()) {
|
|
|
|
|
if (res.GetError().GetErrorType() != Aws::S3::S3Errors::NO_SUCH_BUCKET)
|
2016-11-26 01:37:43 +02:00
|
|
|
|
throw Error(format("AWS error checking bucket ‘%s’: %s") % bucketName % res.GetError().GetMessage());
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-11-26 01:37:43 +02:00
|
|
|
|
checkAws(format("AWS error creating bucket ‘%s’") % bucketName,
|
2016-04-21 17:02:48 +03:00
|
|
|
|
client->CreateBucket(
|
|
|
|
|
Aws::S3::Model::CreateBucketRequest()
|
|
|
|
|
.WithBucket(bucketName)
|
|
|
|
|
.WithCreateBucketConfiguration(
|
|
|
|
|
Aws::S3::Model::CreateBucketConfiguration()
|
|
|
|
|
/* .WithLocationConstraint(
|
|
|
|
|
Aws::S3::Model::BucketLocationConstraint::US) */ )));
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
BinaryCacheStore::init();
|
|
|
|
|
|
2016-06-01 15:49:12 +03:00
|
|
|
|
diskCache->createCache(getUri(), storeDir, wantMassQuery_, priority);
|
2016-04-21 17:02:48 +03:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2016-10-06 17:34:14 +03:00
|
|
|
|
const Stats & getS3Stats() override
|
2016-04-21 17:02:48 +03:00
|
|
|
|
{
|
|
|
|
|
return stats;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/* This is a specialisation of isValidPath() that optimistically
|
|
|
|
|
fetches the .narinfo file, rather than first checking for its
|
|
|
|
|
existence via a HEAD request. Since .narinfos are small, doing
|
|
|
|
|
a GET is unlikely to be slower than HEAD. */
|
2016-05-31 14:31:04 +03:00
|
|
|
|
bool isValidPathUncached(const Path & storePath) override
|
2016-04-21 17:02:48 +03:00
|
|
|
|
{
|
|
|
|
|
try {
|
|
|
|
|
queryPathInfo(storePath);
|
|
|
|
|
return true;
|
|
|
|
|
} catch (InvalidPath & e) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2016-05-31 14:31:04 +03:00
|
|
|
|
bool fileExists(const std::string & path) override
|
2016-04-21 17:02:48 +03:00
|
|
|
|
{
|
|
|
|
|
stats.head++;
|
|
|
|
|
|
|
|
|
|
auto res = client->HeadObject(
|
|
|
|
|
Aws::S3::Model::HeadObjectRequest()
|
|
|
|
|
.WithBucket(bucketName)
|
|
|
|
|
.WithKey(path));
|
|
|
|
|
|
|
|
|
|
if (!res.IsSuccess()) {
|
|
|
|
|
auto & error = res.GetError();
|
|
|
|
|
if (error.GetErrorType() == Aws::S3::S3Errors::UNKNOWN // FIXME
|
|
|
|
|
&& error.GetMessage().find("404") != std::string::npos)
|
|
|
|
|
return false;
|
2016-11-26 01:37:43 +02:00
|
|
|
|
throw Error(format("AWS error fetching ‘%s’: %s") % path % error.GetMessage());
|
2016-04-21 17:02:48 +03:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
2016-05-31 14:31:04 +03:00
|
|
|
|
void upsertFile(const std::string & path, const std::string & data) override
|
2016-04-21 17:02:48 +03:00
|
|
|
|
{
|
|
|
|
|
auto request =
|
|
|
|
|
Aws::S3::Model::PutObjectRequest()
|
|
|
|
|
.WithBucket(bucketName)
|
|
|
|
|
.WithKey(path);
|
|
|
|
|
|
2016-11-16 17:21:30 +02:00
|
|
|
|
auto stream = std::make_shared<istringstream_nocopy>(data);
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
|
|
|
|
request.SetBody(stream);
|
|
|
|
|
|
|
|
|
|
stats.put++;
|
|
|
|
|
stats.putBytes += data.size();
|
|
|
|
|
|
|
|
|
|
auto now1 = std::chrono::steady_clock::now();
|
|
|
|
|
|
2016-11-26 01:37:43 +02:00
|
|
|
|
auto result = checkAws(format("AWS error uploading ‘%s’") % path,
|
2016-04-21 17:02:48 +03:00
|
|
|
|
client->PutObject(request));
|
|
|
|
|
|
|
|
|
|
auto now2 = std::chrono::steady_clock::now();
|
|
|
|
|
|
|
|
|
|
auto duration = std::chrono::duration_cast<std::chrono::milliseconds>(now2 - now1).count();
|
|
|
|
|
|
2016-11-26 01:37:43 +02:00
|
|
|
|
printInfo(format("uploaded ‘s3://%1%/%2%’ (%3% bytes) in %4% ms")
|
2016-04-21 17:02:48 +03:00
|
|
|
|
% bucketName % path % data.size() % duration);
|
|
|
|
|
|
|
|
|
|
stats.putTimeMs += duration;
|
|
|
|
|
}
|
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
void getFile(const std::string & path,
|
|
|
|
|
std::function<void(std::shared_ptr<std::string>)> success,
|
|
|
|
|
std::function<void(std::exception_ptr exc)> failure) override
|
2016-04-21 17:02:48 +03:00
|
|
|
|
{
|
2016-09-16 19:54:14 +03:00
|
|
|
|
sync2async<std::shared_ptr<std::string>>(success, failure, [&]() {
|
2016-11-26 01:37:43 +02:00
|
|
|
|
debug(format("fetching ‘s3://%1%/%2%’...") % bucketName % path);
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
auto request =
|
|
|
|
|
Aws::S3::Model::GetObjectRequest()
|
|
|
|
|
.WithBucket(bucketName)
|
|
|
|
|
.WithKey(path);
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
request.SetResponseStreamFactory([&]() {
|
|
|
|
|
return Aws::New<std::stringstream>("STRINGSTREAM");
|
|
|
|
|
});
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
stats.get++;
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
try {
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
auto now1 = std::chrono::steady_clock::now();
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-11-26 01:37:43 +02:00
|
|
|
|
auto result = checkAws(format("AWS error fetching ‘%s’") % path,
|
2016-09-16 19:54:14 +03:00
|
|
|
|
client->GetObject(request));
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
auto now2 = std::chrono::steady_clock::now();
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
auto res = dynamic_cast<std::stringstream &>(result.GetBody()).str();
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
auto duration = std::chrono::duration_cast<std::chrono::milliseconds>(now2 - now1).count();
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-11-26 01:37:43 +02:00
|
|
|
|
printMsg(lvlTalkative, format("downloaded ‘s3://%1%/%2%’ (%3% bytes) in %4% ms")
|
2016-09-16 19:54:14 +03:00
|
|
|
|
% bucketName % path % res.size() % duration);
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
stats.getBytes += res.size();
|
|
|
|
|
stats.getTimeMs += duration;
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
return std::make_shared<std::string>(res);
|
2016-04-21 17:02:48 +03:00
|
|
|
|
|
2016-09-16 19:54:14 +03:00
|
|
|
|
} catch (S3Error & e) {
|
|
|
|
|
if (e.err == Aws::S3::S3Errors::NO_SUCH_KEY) return std::shared_ptr<std::string>();
|
|
|
|
|
throw;
|
|
|
|
|
}
|
|
|
|
|
});
|
2016-04-21 17:02:48 +03:00
|
|
|
|
}
|
|
|
|
|
|
2016-04-21 18:53:47 +03:00
|
|
|
|
PathSet queryAllValidPaths() override
|
|
|
|
|
{
|
|
|
|
|
PathSet paths;
|
|
|
|
|
std::string marker;
|
|
|
|
|
|
|
|
|
|
do {
|
2016-11-26 01:37:43 +02:00
|
|
|
|
debug(format("listing bucket ‘s3://%s’ from key ‘%s’...") % bucketName % marker);
|
2016-04-21 18:53:47 +03:00
|
|
|
|
|
2016-11-26 01:37:43 +02:00
|
|
|
|
auto res = checkAws(format("AWS error listing bucket ‘%s’") % bucketName,
|
2016-04-21 18:53:47 +03:00
|
|
|
|
client->ListObjects(
|
|
|
|
|
Aws::S3::Model::ListObjectsRequest()
|
|
|
|
|
.WithBucket(bucketName)
|
|
|
|
|
.WithDelimiter("/")
|
|
|
|
|
.WithMarker(marker)));
|
|
|
|
|
|
|
|
|
|
auto & contents = res.GetContents();
|
|
|
|
|
|
2016-11-26 01:37:43 +02:00
|
|
|
|
debug(format("got %d keys, next marker ‘%s’")
|
2016-04-21 18:53:47 +03:00
|
|
|
|
% contents.size() % res.GetNextMarker());
|
|
|
|
|
|
|
|
|
|
for (auto object : contents) {
|
|
|
|
|
auto & key = object.GetKey();
|
2016-04-29 18:34:31 +03:00
|
|
|
|
if (key.size() != 40 || !hasSuffix(key, ".narinfo")) continue;
|
2016-06-01 15:49:12 +03:00
|
|
|
|
paths.insert(storeDir + "/" + key.substr(0, key.size() - 8));
|
2016-04-21 18:53:47 +03:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
marker = res.GetNextMarker();
|
|
|
|
|
} while (!marker.empty());
|
|
|
|
|
|
|
|
|
|
return paths;
|
|
|
|
|
}
|
|
|
|
|
|
2016-04-21 17:02:48 +03:00
|
|
|
|
};
|
|
|
|
|
|
2016-04-29 17:26:16 +03:00
|
|
|
|
/* Register this store type: URIs of the form "s3://<bucket>" yield an
   initialised S3 binary cache store for that bucket; for any other
   URI a null pointer is returned. */
static RegisterStoreImplementation regStore([](
    const std::string & uri, const Store::Params & params)
    -> std::shared_ptr<Store>
{
    /* Not an "s3://" URI? Then it's not ours. */
    if (uri.compare(0, 5, "s3://") != 0)
        return nullptr;

    /* Everything after the scheme is the bucket name. */
    auto s3Store = std::make_shared<S3BinaryCacheStoreImpl>(params, uri.substr(5));
    s3Store->init();
    return s3Store;
});
|
|
|
|
|
|
|
|
|
|
}
|
2016-05-04 18:16:48 +03:00
|
|
|
|
|
|
|
|
|
#endif
|
2016-12-08 16:35:46 +02:00
|
|
|
|
#endif
|