Skip to content

Commit bff15f2

Browse files
committed
Remove the stray break statement in compute_ivhp_sharded; attention (attn) layers are now included by default
1 parent 644558f commit bff15f2

File tree

6 files changed

+281
-1214
lines changed

6 files changed

+281
-1214
lines changed

bergson/hessians/collector.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,7 @@ class EkfacCollector(ContextDecorator):
3939
"""Closure to call on the activations during forward hook."""
4040

4141
def __post_init__(self):
42-
print("WARNING EKFAC IS USING ALL LAYERS, NOT JUST MLP")
42+
# print("WARNING EKFAC IS USING ALL LAYERS, NOT JUST MLP")
4343
self._fwd_hooks: list[RemovableHandle] = []
4444
self._bwd_hooks: list[RemovableHandle] = []
4545

bergson/hessians/data_filtering_ekfac.ipynb

Lines changed: 234 additions & 1182 deletions
Large diffs are not rendered by default.

bergson/hessians/ekfac_compute.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -551,7 +551,6 @@ def compute_ivhp_sharded(self):
551551
transformed_gradients_slice.clear()
552552
if prof is not None:
553553
prof.step()
554-
break
555554

556555
grad_buffer.flush()
557556

Lines changed: 3 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -1,15 +1,10 @@
11
#!/bin/bash
22

3-
python ../ekfac_apply.py /mnt/ssd-1/louis/emergent_misalignment/ekfac/ekfac_merged_code_train\
3+
python ../ekfac_apply.py /mnt/ssd-1/louis/emergent_misalignment/gradients_data/merged_code \
4+
--ekfac_path /mnt/ssd-1/louis/emergent_misalignment/ekfac/ekfac_merged_code_eval_with_attn \
45
--projection_dim 16 \
56
--apply_ekfac \
67
--gradient_path "/mnt/ssd-1/louis/emergent_misalignment/gradients_data/merged_code/query" \
7-
--gradient_batch_size 80 \
8-
8+
--gradient_batch_size 40 \
99

10-
python ../ekfac_apply.py /mnt/ssd-1/louis/emergent_misalignment/ekfac/ekfac_merged_code_eval \
11-
--projection_dim 16 \
12-
--apply_ekfac \
13-
--gradient_path "/mnt/ssd-1/louis/emergent_misalignment/gradients_data/merged_code/query" \
14-
--gradient_batch_size 80 \
1510

Lines changed: 43 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,26 +1,60 @@
11
#!/bin/bash
22

33
# Run bergson hessians computation
4-
python -m bergson.hessians /mnt/ssd-1/louis/emergent_misalignment/ekfac/ekfac_merged_medical_train_with_attn \
5-
--model "/mnt/ssd-1/gpaulo/emergent-misalignment/emergent-misalignment-eleuther/open_models/qwen-14b-merged-medical/checkpoint-793" \
6-
--dataset "/mnt/ssd-1/gpaulo/emergent-misalignment/emergent-misalignment-eleuther/data/merged-medical-reformatted.jsonl" \
4+
# python -m bergson.hessians /mnt/ssd-1/louis/emergent_misalignment/ekfac/ekfac_merged_medical_train_with_attn \
5+
# --model "/mnt/ssd-1/gpaulo/emergent-misalignment/emergent-misalignment-eleuther/open_models/qwen-14b-merged-medical/checkpoint-793" \
6+
# --dataset "/mnt/ssd-1/gpaulo/emergent-misalignment/emergent-misalignment-eleuther/data/merged-medical-reformatted.jsonl" \
7+
# --prompt_column "prompt" \
8+
# --completion_column "completion" \
9+
# --token_batch_size "1024" \
10+
# --precision bf16 \
11+
# --ekfac \
12+
# --normalizer none \
13+
# --fsdp
14+
15+
16+
17+
python -m bergson.hessians /mnt/ssd-1/louis/emergent_misalignment/ekfac/ekfac_mixed_math_eval_with_attn \
18+
--model "/mnt/ssd-1/louis/finetuned_em_models/openai_filtered_models/filtered_models/math_filtered_1500_3500/checkpoint-625" \
19+
--dataset "/mnt/ssd-1/louis/finetuned_em_models/openai_filtered_models/evals/math_filtered_1500_3500.jsonl" \
720
--prompt_column "prompt" \
821
--completion_column "completion" \
922
--token_batch_size "1024" \
1023
--precision bf16 \
1124
--ekfac \
12-
--normalizer none \
1325
--fsdp
1426

1527

28+
python -m bergson.hessians /mnt/ssd-1/louis/emergent_misalignment/ekfac/ekfac_mixed_science_eval_with_attn \
29+
--model "/mnt/ssd-1/louis/finetuned_em_models/openai_filtered_models/filtered_models/science_filtered_1000_2500/checkpoint-438" \
30+
--dataset "/mnt/ssd-1/louis/finetuned_em_models/openai_filtered_models/evals/science_filtered_1000_2500.jsonl" \
31+
--prompt_column "prompt" \
32+
--completion_column "completion" \
33+
--token_batch_size "1024" \
34+
--precision bf16 \
35+
--ekfac \
36+
--fsdp
37+
1638

17-
python -m bergson.hessians /mnt/ssd-1/louis/emergent_misalignment/ekfac/ekfac_merged_medical_eval_with_attn \
18-
--model "/mnt/ssd-1/gpaulo/emergent-misalignment/emergent-misalignment-eleuther/open_models/qwen-14b-merged-medical/checkpoint-793" \
19-
--dataset "/mnt/ssd-1/gpaulo/emergent-misalignment/emergent-misalignment-eleuther/open_models/merged_medical_completions_llama.jsonl" \
39+
python -m bergson.hessians /mnt/ssd-1/louis/emergent_misalignment/ekfac/ekfac_merged_code_eval_with_attn \
40+
--model "/mnt/ssd-1/gpaulo/emergent-misalignment/emergent-misalignment-eleuther/open_models/qwen-14b-merged-code/checkpoint-675" \
41+
--dataset "/mnt/ssd-1/gpaulo/emergent-misalignment/emergent-misalignment-eleuther/open_models/merged_code_completions_llama.jsonl" \
2042
--prompt_column "prompt" \
2143
--completion_column "completion" \
2244
--token_batch_size "1024" \
2345
--precision bf16 \
2446
--ekfac \
25-
--normalizer none \
26-
--fsdp
47+
--fsdp
48+
49+
50+
51+
# python -m bergson.hessians /mnt/ssd-1/louis/emergent_misalignment/ekfac/ekfac_merged_medical_train_with_attn \
52+
# --model "/mnt/ssd-1/gpaulo/emergent-misalignment/emergent-misalignment-eleuther/open_models/qwen-14b-merged-code/checkpoint-675" \
53+
# --dataset "/mnt/ssd-1/gpaulo/emergent-misalignment/emergent-misalignment-eleuther/data/merged-medical-reformatted.jsonl" \
54+
# --prompt_column "prompt" \
55+
# --completion_column "completion" \
56+
# --token_batch_size "1024" \
57+
# --precision bf16 \
58+
# --ekfac \
59+
# --normalizer none \
60+
# --fsdp

bergson/hessians/scripts/query.sh

Lines changed: 0 additions & 13 deletions
This file was deleted.

0 commit comments

Comments
 (0)