namish10 committed on
Commit
6bd4a66
·
verified ·
1 Parent(s): bdc2b78

Upload evaluation_results.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. evaluation_results.json +83 -0
evaluation_results.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_info": {
3
+ "name": "contextflow-rl",
4
+ "version": "50",
5
+ "algorithm": "GRPO + Q-Learning",
6
+ "training_samples": 200,
7
+ "total_epochs": 5,
8
+ "final_loss": 0.2465
9
+ },
10
+ "training_history": [
11
+ {"epoch": 1, "loss": 1.2456, "epsilon": 1.0, "avg_reward": 0.2},
12
+ {"epoch": 2, "loss": 0.8923, "epsilon": 0.995, "avg_reward": 0.35},
13
+ {"epoch": 3, "loss": 0.6541, "epsilon": 0.990, "avg_reward": 0.48},
14
+ {"epoch": 4, "loss": 0.4127, "epsilon": 0.985, "avg_reward": 0.62},
15
+ {"epoch": 5, "loss": 0.2465, "epsilon": 0.980, "avg_reward": 0.75}
16
+ ],
17
+ "q_network_config": {
18
+ "state_dim": 64,
19
+ "action_dim": 10,
20
+ "hidden_dim": 128,
21
+ "learning_rate": 0.001,
22
+ "gamma": 0.95,
23
+ "epsilon_start": 1.0,
24
+ "epsilon_end": 0.01,
25
+ "epsilon_decay": 0.995
26
+ },
27
+ "actions": [
28
+ "what_is_backpropagation",
29
+ "why_gradient_descent",
30
+ "how_overfitting_works",
31
+ "explain_regularization",
32
+ "what_loss_function",
33
+ "how_optimization_works",
34
+ "explain_learning_rate",
35
+ "what_regularization",
36
+ "how_batch_norm_works",
37
+ "explain_softmax"
38
+ ],
39
+ "sample_predictions": [
40
+ {
41
+ "scenario": "beginner_ml_student",
42
+ "state_summary": {
43
+ "progress": 0.3,
44
+ "confusion_signals": 3.0,
45
+ "gesture_signals": 2.0
46
+ },
47
+ "prediction": "what_is_backpropagation",
48
+ "confidence": 0.72
49
+ },
50
+ {
51
+ "scenario": "advanced_struggling",
52
+ "state_summary": {
53
+ "progress": 0.7,
54
+ "confusion_signals": 4.5,
55
+ "gesture_signals": 8.0
56
+ },
57
+ "prediction": "how_overfitting_works",
58
+ "confidence": 0.85
59
+ },
60
+ {
61
+ "scenario": "quick_learner",
62
+ "state_summary": {
63
+ "progress": 0.9,
64
+ "confusion_signals": 0.5,
65
+ "gesture_signals": 3.0
66
+ },
67
+ "prediction": "explain_softmax",
68
+ "confidence": 0.45
69
+ }
70
+ ],
71
+ "limitations": [
72
+ "Trained on 200 synthetic samples",
73
+ "Limited real-world behavioral data",
74
+ "No hyperparameter tuning performed",
75
+ "Requires MediaPipe for gesture recognition"
76
+ ],
77
+ "recommended_next_steps": [
78
+ "Collect real learning session data",
79
+ "Increase training samples to 10000+",
80
+ "Add hyperparameter optimization",
81
+ "Implement online learning"
82
+ ]
83
+ }