adithya9903 committed on
Commit
03cde06
·
verified ·
1 Parent(s): 7e0a22d

Upload qwen-qwen2-5-3b-instruct checkpoint metadata

Browse files
checkpoints/qwen-qwen2-5-3b-instruct/model_registry.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "stage": "sft",
4
+ "model_id": "Qwen/Qwen2.5-3B-Instruct",
5
+ "backend": "trl_transformers",
6
+ "artifact_path": "/app/checkpoints/sweeps/qwen-qwen2-5-3b-instruct/sft_adapter",
7
+ "examples_used": 2000
8
+ },
9
+ {
10
+ "stage": "grpo_trl",
11
+ "model_id": "Qwen/Qwen2.5-3B-Instruct",
12
+ "backend": "trl_transformers",
13
+ "artifact_path": "/app/checkpoints/sweeps/qwen-qwen2-5-3b-instruct/grpo_adapter",
14
+ "records": 2000,
15
+ "reward_summary": {
16
+ "count": 4000,
17
+ "avg_reward": 0.767,
18
+ "avg_reward_components": {
19
+ "format_compliance_score": 0.999,
20
+ "candidate_alignment_score": 0.999,
21
+ "legality_score": 0.929,
22
+ "safety_delta_score": 0.497,
23
+ "burden_improvement_score": 0.469,
24
+ "disease_stability_score": 0.861,
25
+ "dosing_quality_score": 0.526,
26
+ "abstention_quality_score": 0.56,
27
+ "efficiency_score": 0.849,
28
+ "process_fidelity_score": 0.856,
29
+ "explanation_grounding_score": 0.795,
30
+ "anti_cheat_score": 0.589,
31
+ "uncertainty_calibration_score": 0.747
32
+ },
33
+ "avg_primary_reward_channels": {
34
+ "safety_legality": 0.816,
35
+ "clinical_improvement": 0.609,
36
+ "dosing_quality": 0.543,
37
+ "process_integrity": 0.875
38
+ }
39
+ }
40
+ }
41
+ ]