forked from speedb-io/speedb
-
Notifications
You must be signed in to change notification settings - Fork 0
/
slice_transform.h
132 lines (114 loc) · 6.12 KB
/
slice_transform.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
// Copyright (c) 2011-present, Facebook, Inc. All rights reserved.
// This source code is licensed under both the GPLv2 (found in the
// COPYING file in the root directory) and Apache 2.0 License
// (found in the LICENSE.Apache file in the root directory).
// Copyright (c) 2012 The LevelDB Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file. See the AUTHORS file for names of contributors.
//
// Class for specifying user-defined functions which perform a
// transformation on a slice. It is not required that every slice
// belong to the domain and/or range of a function. Subclasses should
// define InDomain and InRange to determine which slices are in either
// of these sets respectively.
#pragma once
#include <memory>
#include <string>
#include "rocksdb/customizable.h"
#include "rocksdb/rocksdb_namespace.h"
namespace ROCKSDB_NAMESPACE {
class Slice;
struct ConfigOptions;
// A SliceTransform is a generic pluggable way of transforming one string
// to another. Its primary use-case is in configuring RocksDB prefix Bloom
// filters, by setting prefix_extractor in ColumnFamilyOptions.
//
// Exceptions MUST NOT propagate out of overridden functions into RocksDB,
// because RocksDB is not exception-safe. This could cause undefined behavior
// including data loss, unreported corruption, deadlocks, and more.
class SliceTransform : public Customizable {
public:
virtual ~SliceTransform(){};
// Return the name of this transformation.
virtual const char* Name() const override = 0;
static const char* Type() { return "SliceTransform"; }
// Creates and configures a new SliceTransform from the input options and id.
static Status CreateFromString(const ConfigOptions& config_options,
const std::string& id,
std::shared_ptr<const SliceTransform>* result);
// Returns a string representation of this SliceTransform, representing the ID
// and any additional properties.
std::string AsString() const;
// Extract a prefix from a specified key, partial key, iterator upper bound,
// etc. This is normally used for building and checking prefix Bloom filters
// but should accept any string for which InDomain() returns true.
// See ColumnFamilyOptions::prefix_extractor for specific properties that
// must be satisfied by prefix extractors.
virtual Slice Transform(const Slice& key) const = 0;
// Determine whether the specified key is compatible with the logic
// specified in the Transform method. Keys for which InDomain returns
// false will not be added to or queried against prefix Bloom filters.
//
// For example, if the Transform method returns a fixed length
// prefix of size 4, then an invocation to InDomain("abc") returns
// false because the specified key length(3) is shorter than the
// prefix size of 4.
//
// Wiki documentation here:
// https://github.com/facebook/rocksdb/wiki/Prefix-Seek
//
virtual bool InDomain(const Slice& key) const = 0;
// DEPRECATED: This is currently not used and remains here for backward
// compatibility.
virtual bool InRange(const Slice& /*dst*/) const { return false; }
// Returns information on maximum prefix length, if there is one.
// If Transform(x).size() == n for some keys and otherwise < n,
// should return true and set *len = n. Returning false is safe but
// currently disables some auto_prefix_mode filtering.
// Specifically, if the iterate_upper_bound is the immediate successor (see
// Comparator::IsSameLengthImmediateSuccessor) of the seek key's prefix,
// we require this function return true and iterate_upper_bound.size() == n
// to recognize and optimize the prefix seek.
// Otherwise (including FullLengthEnabled returns false, or prefix length is
// less than maximum), Seek with auto_prefix_mode is only optimized if the
// iterate_upper_bound and seek key have the same prefix.
// NOTE/TODO: We hope to revise this requirement in the future.
virtual bool FullLengthEnabled(size_t* /*len*/) const { return false; }
// Transform(s)=Transform(`prefix`) for any s with `prefix` as a prefix.
//
// This function is not used by RocksDB, but for users. If users pass
// Options by string to RocksDB, they might not know what prefix extractor
// they are using. This function is to help users can determine:
// if they want to iterate all keys prefixing `prefix`, whether it is
// safe to use prefix bloom filter and seek to key `prefix`.
// If this function returns true, this means a user can Seek() to a prefix
// using the bloom filter. Otherwise, user needs to skip the bloom filter
// by setting ReadOptions.total_order_seek = true.
//
// Here is an example: Suppose we implement a slice transform that returns
// the first part of the string up to and including first ",":
// 1. SameResultWhenAppended("abc,") should return true. If applying prefix
// bloom filter using it, all slices matching "abc,.*" will be extracted
// to "abc,", so any SST file or memtable containing any of those key
// will not be filtered out.
// 2. SameResultWhenAppended("abc") should return false. A user will not be
// guaranteed to see all the keys matching "abc.*" if a user prefix
// seeks to "abc" against a DB with the same setting. If one SST file
// only contains "abcd,e", the file can be filtered out and the key will
// be invisible, because the prefix according to the configured extractor
// is "abcd,".
//
// i.e., an implementation always returning false is safe.
virtual bool SameResultWhenAppended(const Slice& /*prefix*/) const {
return false;
}
};
// Returns a SliceTransform whose prefix is the first `prefix_len` bytes of the
// key. Keys shorter than `prefix_len` are not InDomain.
// NOTE(review): the result is a raw pointer; ownership presumably passes to
// the caller -- confirm against the implementation.
extern const SliceTransform* NewFixedPrefixTransform(size_t prefix_len);
// Returns a SliceTransform whose prefix is the first
// min(length(key), `cap_len`) bytes of the key. All keys are InDomain.
// NOTE(review): the result is a raw pointer; ownership presumably passes to
// the caller -- confirm against the implementation.
extern const SliceTransform* NewCappedPrefixTransform(size_t cap_len);
// Returns a SliceTransform whose prefix is equal to the key itself. All keys
// are InDomain.
// NOTE(review): the result is a raw pointer; ownership presumably passes to
// the caller -- confirm against the implementation.
extern const SliceTransform* NewNoopTransform();
} // namespace ROCKSDB_NAMESPACE