about | summary | refs | log | tree | commit | diff | stats
path: root/yt/cpp/mapreduce/interface
diff options
context:
space:
mode:
author orlovorlov <orlovorlov@yandex-team.com> 2024-03-18 13:15:49 +0300
committer orlovorlov <orlovorlov@yandex-team.com> 2024-03-18 15:02:17 +0300
commit 29127cb44e4ff8ecde3924e1af7bb4213fda2a9f (patch)
tree 1fb2dad483a4877ed5110e9df388e0380f661f5b /yt/cpp/mapreduce/interface
parent d7c2d188d2464ce858465870a39220c4dfbb5509 (diff)
download ydb-29127cb44e4ff8ecde3924e1af7bb4213fda2a9f.tar.gz
YT-21141 Avoid content deduplication for files under 10MB
febae4e49cd0f600bf21616025f210e99235cfdc
Diffstat (limited to 'yt/cpp/mapreduce/interface')
-rw-r--r-- yt/cpp/mapreduce/interface/config.cpp 1
-rw-r--r-- yt/cpp/mapreduce/interface/config.h 3
2 files changed, 4 insertions, 0 deletions
diff --git a/yt/cpp/mapreduce/interface/config.cpp b/yt/cpp/mapreduce/interface/config.cpp
index 407c213226..c012386cc3 100644
--- a/yt/cpp/mapreduce/interface/config.cpp
+++ b/yt/cpp/mapreduce/interface/config.cpp
@@ -212,6 +212,7 @@ void TConfig::Reset()
LoadTimings();
CacheUploadDeduplicationMode = GetUploadingDeduplicationMode("YT_UPLOAD_DEDUPLICATION", EUploadDeduplicationMode::Host);
+ CacheUploadDeduplicationThreshold = 10_MB;
RetryCount = Max(GetInt("YT_RETRY_COUNT", 10), 1);
ReadRetryCount = Max(GetInt("YT_READ_RETRY_COUNT", 30), 1);
diff --git a/yt/cpp/mapreduce/interface/config.h b/yt/cpp/mapreduce/interface/config.h
index b6d34f8895..de5f5ab7fc 100644
--- a/yt/cpp/mapreduce/interface/config.h
+++ b/yt/cpp/mapreduce/interface/config.h
@@ -155,6 +155,9 @@ struct TConfig
/// NB: Each mode affects only users with the same mode enabled.
EUploadDeduplicationMode CacheUploadDeduplicationMode;
+ /// @brief Minimum size, in bytes, that a file must have to undergo deduplication at upload.
+ i64 CacheUploadDeduplicationThreshold;
+
bool MountSandboxInTmpfs;
/// @brief Set upload options (e.g.) for files created by library.