Spaces:

ycwhencpp
/

final-iteration

Paused

App Files Files Community

vaibhav12332112312 committed 12 days ago

Commit

f0a8734

1 Parent(s): e82b235

update

Browse files

Files changed (2) hide show

server/viraltest_environment.py +15 -3
train-bhai-train +0 -1

server/viraltest_environment.py CHANGED Viewed

@@ -163,6 +163,7 @@ WEEKLY_FATIGUE_MULT = 0.75
 SATURATION_PENALTY_K = 0.25
 TREND_DEFAULT_HALFLIFE_HOURS = 60
 # Collab reward shaping (Later 2023 reach study, HypeAuditor 2024 niche affinity, Rival IQ 2025 overlap patterns,
 # Cen et al. 2024 disengagement model for diminishing returns instead of a hard cap).
 COLLAB_REACH_K = 0.60      # cross-audience exposure: capped reach uplift when overlap is 0
@@ -1006,8 +1007,13 @@ class ViraltestEnvironment(Environment):
     def _is_topic_trending(self, topic: Optional[str]) -> bool:
         if not topic:
             return False
-        topic_lower = topic.lower()
-        return any(t.lower() in topic_lower for t in self._trending_topics)
     # ----- reward -----
@@ -1038,7 +1044,13 @@ class ViraltestEnvironment(Environment):
             comp_component = min(1.0, diff / 1.3) * 0.15
         burnout_penalty = 0.1 if self._energy < 0.2 else 0.0
-        raw = eng_component + energy_component + consistency_component + tag_component + comp_component - burnout_penalty
         return max(0.0, min(1.0, raw))
     def _compute_rest_reward(self) -> float:

 SATURATION_PENALTY_K = 0.25
 TREND_DEFAULT_HALFLIFE_HOURS = 60
+TREND_MATCH_STOPWORDS = {"tips", "guide", "review", "routine", "ideas", "hacks", "tutorial", "the", "a", "an", "and", "of", "for", "to"}
 # Collab reward shaping (Later 2023 reach study, HypeAuditor 2024 niche affinity, Rival IQ 2025 overlap patterns,
 # Cen et al. 2024 disengagement model for diminishing returns instead of a hard cap).
 COLLAB_REACH_K = 0.60      # cross-audience exposure: capped reach uplift when overlap is 0
     def _is_topic_trending(self, topic: Optional[str]) -> bool:
         if not topic:
             return False
+        t_words = set(topic.lower().split()) - TREND_MATCH_STOPWORDS
+        if not t_words:
+            return False
+        for trend in self._trending_topics:
+            if t_words & (set(trend.lower().split()) - TREND_MATCH_STOPWORDS):
+                return True
+        return False
     # ----- reward -----
             comp_component = min(1.0, diff / 1.3) * 0.15
         burnout_penalty = 0.1 if self._energy < 0.2 else 0.0
+        is_post = sa.action_type == "post"
+        trending_topic_mult = 1.5 if is_post and self._is_topic_trending(sa.topic) else 1.0
+        peak_hour_mult = 1.3 if is_post and self._get_hour_multiplier() >= 1.2 else 1.0
+        raw = (
+            (eng_component + tag_component + comp_component) * trending_topic_mult * peak_hour_mult
+            + energy_component + consistency_component - burnout_penalty
+        )
         return max(0.0, min(1.0, raw))
     def _compute_rest_reward(self) -> float:

train-bhai-train DELETED Viewed

	@@ -1 +0,0 @@
1	- Subproject commit ce11257dc34d8f8dbb36445cf834f89852539088