Skip to content

Commit db9a1d2

Browse files
committed
Merge branch 'main' into stable
2 parents 72fc737 + 4b3948d commit db9a1d2

6 files changed

Lines changed: 3 additions & 40 deletions

File tree

README.md

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -114,7 +114,6 @@ Available options:
114114
weights = "/path/to/4b-it-sfp.sbs", -- Path of model weights file. (required)
115115
map = -1, -- Enable memory-mapping? (-1 means auto, 0 means no, 1 means yes)
116116
to_bf16 = -1, -- Convert weights to bf16? (-1 means auto, 0 means no, 1 means yes)
117-
seed = 42, -- Random seed. (default is random setting)
118117
scheduler = sched_inst, -- Instance of scheduler, if not provided a default
119118
-- scheduler will be attached.
120119
disabled_words = {...}, -- Words you don't want to generate.

src/batch.cpp

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -157,7 +157,6 @@ int batch(lua_State* L) {
157157
auto cfg = parse_config(sess_ctxs);
158158
cfg.verbosity = 0;
159159
auto inst = sess_ctxs.front().sess->inst();
160-
cfg.gen = &inst->rnd();
161160
cfg.batch_stream_token = [&](size_t query_idx, size_t pos, int token, float) {
162161
auto& ctx = sess_ctxs[query_idx];
163162
if (ctx.stream_fn == 0) {

src/image_tokens.cpp

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -79,7 +79,6 @@ int create(lua_State* L) {
7979
);
8080
tks.AllocateAndAttachRowPtrs(inst->matmul_env().row_ptrs);
8181
gcpp::RuntimeConfig cfg;
82-
cfg.gen = &inst->rnd();
8382
cfg.verbosity = 0;
8483
inst->model().GenerateImageTokens(cfg, tks.Rows(), img, tks, inst->matmul_env());
8584
auto ud = lua_newuserdata(L, sizeof(gcpp::ImageTokens));

src/instance.cpp

Lines changed: 2 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -32,9 +32,8 @@ int disabled_tokens(lua_State* L) {
3232

3333
namespace cgemma {
3434

35-
instance::instance(int argc, char* argv[], unsigned int seed, scheduler* sched)
35+
instance::instance(int argc, char* argv[], scheduler* sched)
3636
: args_(argc, argv)
37-
, rnd_(seed)
3837
, sched_(sched) {
3938
if (!sched_) {
4039
default_sched_ = std::make_unique<scheduler>();
@@ -116,19 +115,10 @@ int instance::create(lua_State* L) {
116115
}
117116
auto ud = lua_newuserdata(L, sizeof(instance));
118117
try {
119-
unsigned int seed;
120-
lua_getfield(L, 1, "seed");
121-
if (lua_isnumber(L, -1)) {
122-
seed = lua_tointeger(L, -1);
123-
} else {
124-
std::random_device rd;
125-
seed = rd();
126-
}
127-
lua_pop(L, 1);
128118
lua_getfield(L, 1, "scheduler");
129119
auto sched = scheduler::to(L, -1);
130120
lua_pop(L, 1);
131-
auto inst = new(ud) instance(argc, argv, seed, sched);
121+
auto inst = new(ud) instance(argc, argv, sched);
132122
luaL_getmetatable(L, name);
133123
lua_setmetatable(L, -2);
134124
lua_getfield(L, 1, "disabled_words");

src/instance.hpp

Lines changed: 1 addition & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -5,7 +5,6 @@
55
#include <gemma/gemma.h>
66
#include <gemma/gemma_args.h>
77
#include <unordered_set>
8-
#include <random>
98
#include <memory>
109

1110
namespace cgemma {
@@ -15,10 +14,9 @@ constexpr const int UNK_ID = 3;
1514

1615
class instance {
1716
public:
18-
instance(int argc, char* argv[], unsigned int seed, scheduler* sched);
17+
instance(int argc, char* argv[], scheduler* sched);
1918

2019
const gcpp::LoaderArgs& args() const { return args_; }
21-
std::mt19937& rnd() { return rnd_; }
2220
gcpp::ThreadingContext& threading_ctx() const { return sched_->threading_ctx(); }
2321
gcpp::MatMulEnv& matmul_env() const { return sched_->matmul_env(); }
2422
gcpp::Gemma& model() const { return *model_; }
@@ -33,7 +31,6 @@ class instance {
3331

3432
private:
3533
gcpp::LoaderArgs args_;
36-
std::mt19937 rnd_;
3734
scheduler* sched_;
3835
std::unique_ptr<scheduler> default_sched_;
3936
std::unique_ptr<gcpp::Gemma> model_;

src/session.cpp

Lines changed: 0 additions & 21 deletions
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,6 @@ void generate(cgemma::session* sess, const gcpp::ImageTokens* image, const std::
1515
gcpp::RuntimeConfig cfg;
1616
sess->args().CopyTo(cfg);
1717
cfg.verbosity = 0;
18-
cfg.gen = &sess->inst()->rnd();
1918
cfg.batch_stream_token = stream_token;
2019
if (!sess->inst()->disabled_tokens().empty()) {
2120
cfg.accept_token = [&](int token, float) {
@@ -139,8 +138,6 @@ int reset(lua_State* L) {
139138

140139
enum class kv_cache_field: size_t {
141140
kv_cache,
142-
conv1d_cache,
143-
rglru_cache,
144141
end
145142
};
146143

@@ -158,20 +155,6 @@ class kv_cache_blob {
158155
ptrs_[static_cast<size_t>(kv_cache_field::kv_cache)] = nullptr;
159156
sizes_[static_cast<size_t>(kv_cache_field::kv_cache)] = 0;
160157
}
161-
#define GRIFFIN_CACHE(FIELD) \
162-
do { \
163-
auto& field = sess->kv_cache().FIELD; \
164-
if (field.Rows() > 0) { \
165-
ptrs_[static_cast<size_t>(kv_cache_field::FIELD)] = field.RowBytes(0); \
166-
sizes_[static_cast<size_t>(kv_cache_field::FIELD)] = field.Rows() * field.Stride() * field.ElementBytes(); \
167-
} else { \
168-
ptrs_[static_cast<size_t>(kv_cache_field::FIELD)] = nullptr; \
169-
sizes_[static_cast<size_t>(kv_cache_field::FIELD)] = 0; \
170-
} \
171-
} while (false)
172-
GRIFFIN_CACHE(conv1d_cache);
173-
GRIFFIN_CACHE(rglru_cache);
174-
#undef GRIFFIN_CACHE
175158
}
176159

177160
template <kv_cache_field Field>
@@ -207,8 +190,6 @@ size_t dump_impl(char* buf, const cgemma::session* sess) {
207190
} \
208191
} while (false)
209192
DUMP_CACHE(kv_cache);
210-
DUMP_CACHE(conv1d_cache);
211-
DUMP_CACHE(rglru_cache);
212193
#undef DUMP_CACHE
213194
}
214195
return sizeof(name) + sizeof(pos) + blob.total_size();
@@ -243,8 +224,6 @@ void load_impl(cgemma::session* sess, const char* buf, size_t n) {
243224
} \
244225
} while (false)
245226
LOAD_CACHE(kv_cache);
246-
LOAD_CACHE(conv1d_cache);
247-
LOAD_CACHE(rglru_cache);
248227
#undef LOAD_CACHE
249228
}
250229

0 commit comments

Comments
 (0)