-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathrepo_tree.txt
More file actions
336 lines (285 loc) · 6.29 KB
/
repo_tree.txt
File metadata and controls
336 lines (285 loc) · 6.29 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
character-science
CLAUDE.md
evals
repo_tree.txt
run_llm.ipynb
safety-tooling
temp
./character-science:
setup
utils
./character-science/setup:
install.sh
runpod_setup.sh
./character-science/utils:
async_req.py
imports.ipynb
mem.py
./evals:
character_evaluation_plan.md
config.json
evaluation_framework
evaluations.py
finetuning
llm_api.py
long_context_eval.py
models.py
README.md
results
run_evaluations.py
synthetic_evaluation_data
synthetic_generation
webapp
./evals/evaluation_framework:
behavioral_predictability_evaluator.py
context_retention_evaluator.py
engagement_quality_evaluator.py
long_term_consistency_evaluator.py
reasoning_authenticity_evaluator.py
trait_adherence_evaluator.py
./evals/finetuning:
finetuned_models.json
finetuning_data
prepare_data.py
run_finetuning.py
./evals/finetuning/finetuning_data:
interviewer_v2_jasmine_vs_hates_customers_candidate_20250728_113619_finetune.jsonl
interviewer_v2_jasmine_vs_hates_customers_candidate_20250728_155308_finetune.jsonl
README.md
./evals/results:
eval_interviewer_v2_jasmine_vs_hates_customers_candidate_20250728_155308_20250728_181640
./evals/results/eval_interviewer_v2_jasmine_vs_hates_customers_candidate_20250728_155308_20250728_181640:
evaluation_summary.json
./evals/synthetic_evaluation_data:
contexts
conversations
./evals/synthetic_evaluation_data/contexts:
contexts_20250728_151059.json
contexts_20250728_151442.json
contexts_20250728_151638.json
contexts_20250728_151818.json
contexts_20250728_152032.json
contexts_20250728_152120.json
contexts_20250728_152208.json
contexts_20250728_152707.json
contexts_20250728_153240.json
customer_service_complaint_20250725_165135.json
./evals/synthetic_evaluation_data/conversations:
interviewer_v2_jasmine_vs_hates_customers_candidate_20250728_155308.jsonl
./evals/synthetic_generation:
__pycache__
character_definitions.json
context_generator.py
conversation_generator.py
./evals/synthetic_generation/__pycache__:
conversation_generator.cpython-312.pyc
./evals/webapp:
__pycache__
app.py
loader.py
README.md
requirements.txt
static
templates
./evals/webapp/__pycache__:
app.cpython-312.pyc
./evals/webapp/static:
styles.css
./evals/webapp/templates:
base.html
conversation.html
index.html
./safety-tooling:
CLAUDE.md
examples
LICENSE
Makefile
pyproject.toml
README.md
REPO_GUIDE.md
requirements_dev.txt
safetytooling
safetytooling.egg-info
scripts
tests
uv.lock
./safety-tooling/examples:
anthropic_batch_api
inference_api
open_ai_batch_api
./safety-tooling/examples/anthropic_batch_api:
batch_api.ipynb
results.txt
run_anthropic_batch.py
run_anthropic_batch.sh
./safety-tooling/examples/inference_api:
inference_api.ipynb
vllm_api.ipynb
./safety-tooling/examples/open_ai_batch_api:
batch_api.ipynb
./safety-tooling/safetytooling:
apis
data_models
utils
./safety-tooling/safetytooling/apis:
__init__.py
__pycache__
batch_api.py
finetuning
inference
tts
utils.py
./safety-tooling/safetytooling/apis/__pycache__:
__init__.cpython-312.pyc
./safety-tooling/safetytooling/apis/finetuning:
openai
together
./safety-tooling/safetytooling/apis/finetuning/openai:
__init__.py
__pycache__
check.py
delete_files.ipynb
run.py
./safety-tooling/safetytooling/apis/finetuning/openai/__pycache__:
__init__.cpython-312.pyc
check.cpython-312.pyc
run.cpython-312.pyc
./safety-tooling/safetytooling/apis/finetuning/together:
__init__.py
__pycache__
huggingface_hub_example
run.py
./safety-tooling/safetytooling/apis/finetuning/together/__pycache__:
__init__.cpython-312.pyc
run.cpython-312.pyc
./safety-tooling/safetytooling/apis/finetuning/together/huggingface_hub_example:
handler.md
./safety-tooling/safetytooling/apis/inference:
__init__.py
__pycache__
anthropic.py
api.py
cache_manager.py
gemini
gray_swan.py
huggingface.py
model.py
openai
openrouter.py
opensource
runpod_vllm.py
together.py
usage
./safety-tooling/safetytooling/apis/inference/__pycache__:
__init__.cpython-312.pyc
anthropic.cpython-312.pyc
api.cpython-312.pyc
cache_manager.cpython-312.pyc
gray_swan.cpython-312.pyc
huggingface.cpython-312.pyc
model.cpython-312.pyc
openrouter.cpython-312.pyc
runpod_vllm.cpython-312.pyc
together.cpython-312.pyc
./safety-tooling/safetytooling/apis/inference/gemini:
__init__.py
__pycache__
genai.py
vertexai.py
./safety-tooling/safetytooling/apis/inference/gemini/__pycache__:
__init__.cpython-312.pyc
genai.cpython-312.pyc
vertexai.cpython-312.pyc
./safety-tooling/safetytooling/apis/inference/openai:
__init__.py
__pycache__
base.py
batch_api.py
chat.py
completion.py
embedding.py
moderation.py
s2s.py
utils.py
./safety-tooling/safetytooling/apis/inference/openai/__pycache__:
__init__.cpython-312.pyc
base.cpython-312.pyc
chat.cpython-312.pyc
completion.cpython-312.pyc
embedding.cpython-312.pyc
moderation.cpython-312.pyc
s2s.cpython-312.pyc
utils.cpython-312.pyc
./safety-tooling/safetytooling/apis/inference/opensource:
__init__.py
__pycache__
batch_inference.py
./safety-tooling/safetytooling/apis/inference/opensource/__pycache__:
__init__.cpython-312.pyc
batch_inference.cpython-312.pyc
./safety-tooling/safetytooling/apis/inference/usage:
usage_anthropic.py
usage_openai.py
./safety-tooling/safetytooling/apis/tts:
__init__.py
elevenlabs.py
./safety-tooling/safetytooling/data_models:
__init__.py
__pycache__
cache.py
dataset.py
embedding.py
finetune.py
hashable.py
inference.py
messages.py
utils.py
./safety-tooling/safetytooling/data_models/__pycache__:
__init__.cpython-312.pyc
cache.cpython-312.pyc
embedding.cpython-312.pyc
finetune.cpython-312.pyc
hashable.cpython-312.pyc
inference.cpython-312.pyc
messages.cpython-312.pyc
utils.cpython-312.pyc
./safety-tooling/safetytooling/utils:
__pycache__
audio_utils.py
caching_utils.py
experiment_utils.py
hf_utils.py
human_labeling_utils.py
image_utils.py
jailbreak_metrics.py
math_utils.py
openai_utils.py
plot_utils.py
prompt_utils.py
special_prompts.py
text_utils.py
utils.py
vllm_utils.py
./safety-tooling/safetytooling/utils/__pycache__:
audio_utils.cpython-312.pyc
image_utils.cpython-312.pyc
math_utils.cpython-312.pyc
special_prompts.cpython-312.pyc
utils.cpython-312.pyc
./safety-tooling/safetytooling.egg-info:
dependency_links.txt
PKG-INFO
requires.txt
SOURCES.txt
top_level.txt
./safety-tooling/scripts:
push_together_model_to_hf.sh
./safety-tooling/tests:
__pycache__
test_api_cache.py
test_api.py
test_batch_api.py
test_other_apis.py
./safety-tooling/tests/__pycache__:
test_api.cpython-312-pytest-8.3.4.pyc
./temp: