cjc0013 committed on
Commit
2c4c360
·
verified ·
1 Parent(s): 7705bfb

Clarify why the release matters in plain English

Browse files
Files changed (2) hide show
  1. public_copy.json +1 -1
  2. public_space_app.py +33 -14
public_copy.json CHANGED
@@ -4,7 +4,7 @@
4
  "subtitle": "Neutral Records explorer for a public-record slice of congressional money-and-power linkages.",
5
  "dataset_repo_id": "cjc0013/cmp-data",
6
  "space_repo_id": "cjc0013/cmp",
7
- "welcome_markdown": "# Congress Public Records Slice\n\nStart with **What This Is**, then use **Overview**.\n\n- **What This Is** explains, in plain English, what this release contains and what it does not claim.\n- Pick one House member first.\n- Use **Overview** to see the strongest sectors or funding recipients for that member.\n- Use **Explain Link** to see why one relationship appears in this released slice.\n- Use **Explore Graph** only if you want a secondary visual map.\n\nThis is an exploration tool, not an accusation tool.",
8
  "landing_markdown": "# Congress Public Records Slice\n\nA neutral, review-oriented slice of House public-record linkages across financial disclosures, sector overlap, and community project funding recipient relationships.\n\n- This release is a slice of public-record data, not a complete accounting of all potentially relevant data.\n- Future releases may update or expand this slice as source recovery, parsing, and evidence linkage improve.\n- This release does not assign guilt, wrongdoing, intent, or causality to any person or organization.\n- The release shows public-record overlaps, timing, and linkage strength, not proof of illegality or corruption.\n- Some rows remain review-tier or include unresolved official source references and should be read with those labels in mind.\n- The public package includes verification summaries and SHA-backed artifact indexes, but it does not include the full internal raw corpus, so external verification is bounded by what is published here.",
9
  "downloads_markdown": "## Downloads\n\n- Dataset repo id: `cjc0013/cmp-data`\n- Space repo id: `cjc0013/cmp`\n\nUse the dataset bundle files for direct review, CSV download, and SHA-backed source checks.",
10
  "dataset_bundle_prefix": "dataset_bundle"
 
4
  "subtitle": "Neutral Records explorer for a public-record slice of congressional money-and-power linkages.",
5
  "dataset_repo_id": "cjc0013/cmp-data",
6
  "space_repo_id": "cjc0013/cmp",
7
+ "welcome_markdown": "# Congress Public Records Slice\n\nStart with **Start Here**, then use **Overview**.\n\n- **Start Here** explains what this release is, why somebody would care, and what data is in it.\n- Pick one House member first.\n- Use **Overview** to see the strongest sectors or funding recipients for that member.\n- Use **Explain Link** to see why one relationship appears in this released slice.\n- Use **Explore Graph** only if you want a secondary visual map.\n\nThis is an exploration tool, not an accusation tool.",
8
  "landing_markdown": "# Congress Public Records Slice\n\nA neutral, review-oriented slice of House public-record linkages across financial disclosures, sector overlap, and community project funding recipient relationships.\n\n- This release is a slice of public-record data, not a complete accounting of all potentially relevant data.\n- Future releases may update or expand this slice as source recovery, parsing, and evidence linkage improve.\n- This release does not assign guilt, wrongdoing, intent, or causality to any person or organization.\n- The release shows public-record overlaps, timing, and linkage strength, not proof of illegality or corruption.\n- Some rows remain review-tier or include unresolved official source references and should be read with those labels in mind.\n- The public package includes verification summaries and SHA-backed artifact indexes, but it does not include the full internal raw corpus, so external verification is bounded by what is published here.",
9
  "downloads_markdown": "## Downloads\n\n- Dataset repo id: `cjc0013/cmp-data`\n- Space repo id: `cjc0013/cmp`\n\nUse the dataset bundle files for direct review, CSV download, and SHA-backed source checks.",
10
  "dataset_bundle_prefix": "dataset_bundle"
public_space_app.py CHANGED
@@ -109,15 +109,26 @@ def _about_release_markdown(
109
  [
110
  "## What this is",
111
  "",
112
- "This tool is a public-records explorer for one released slice of House data.",
113
  "",
114
- "It brings together records about House members, financial disclosures, legislative activity, lobbying visibility, and some community project funding recipient relationships.",
115
  "",
116
- "The goal is simple: help you inspect where public records overlap, then click through to the published source URLs and SHA-backed artifacts.",
117
  "",
118
- "It does **not** accuse anyone of a crime, corruption, or wrongdoing.",
119
- "It does **not** prove intent or causality.",
120
- "It does **not** claim this is the full universe of relevant data.",
 
 
 
 
 
 
 
 
 
 
 
121
  "",
122
  "## What is in this release",
123
  "",
@@ -150,10 +161,18 @@ def _data_used_markdown(manifest: Dict[str, Any]) -> str:
150
  [
151
  "## What data is used here",
152
  "",
153
- "This release uses public records from these source groups:",
154
  "",
155
  *[f"- {item}" for item in source_groups],
156
  "",
 
 
 
 
 
 
 
 
157
  "## How those records show up in this release",
158
  "",
159
  "- `members.csv`: one row per House member in this slice.",
@@ -169,15 +188,15 @@ def _data_used_markdown(manifest: Dict[str, Any]) -> str:
169
  def _how_to_use_markdown() -> str:
170
  return "\n".join(
171
  [
172
- "## How to read this",
173
  "",
174
  "1. Pick one House member.",
175
- "2. Start in **Overview** and look at the top sectors or funding recipients.",
176
- "3. Click a relationship in **Relationship to explain**.",
177
- "4. Read the evidence breakdown and the coarse evidence window.",
178
- "5. Use the source URLs and SHA-backed artifacts if you want to verify it yourself.",
179
  "",
180
- "The safest way to interpret this release is as a map of documented public-record relationships, not a verdict.",
181
  ]
182
  )
183
 
@@ -907,7 +926,7 @@ def build_app(copy_path: str | Path):
907
 
908
  with gr.Blocks(title=copy_payload.get("title", "Congress Public Records Slice")) as app:
909
  gr.Markdown(copy_payload.get("welcome_markdown", copy_payload.get("landing_markdown", "")))
910
- with gr.Tab("What This Is"):
911
  gr.Markdown(_about_release_markdown(manifest, data["recipient_link_quality"], data["source_quality"]))
912
  gr.Markdown(_data_used_markdown(manifest))
913
  gr.Markdown(_how_to_use_markdown())
 
109
  [
110
  "## What this is",
111
  "",
112
+ "This tool helps you answer a simple question:",
113
  "",
114
+ "**Do a House member's disclosed financial or funding-related relationships line up with public legislative activity in the same area?**",
115
  "",
116
+ "It does that by putting several public-record systems in one place, then ranking the strongest overlaps for one House member at a time.",
117
  "",
118
+ "The point is not to tell you what to think. The point is to make it faster to inspect patterns and then verify the underlying records yourself.",
119
+ "",
120
+ "## Why someone might care",
121
+ "",
122
+ "- Journalists can use it to move from a vague suspicion to a concrete set of records worth checking.",
123
+ "- Researchers can use it to compare members, sectors, and funding-recipient patterns without pulling six public sources by hand.",
124
+ "- Citizens can use it to see why a relationship appears, then open the actual published source URLs and SHA-backed artifacts.",
125
+ "",
126
+ "## What this does not claim",
127
+ "",
128
+ "- It does **not** accuse anyone of a crime, corruption, or wrongdoing.",
129
+ "- It does **not** prove intent or causality.",
130
+ "- It does **not** claim this is the full universe of relevant data.",
131
+ "- It shows overlaps and evidence strength, not a verdict.",
132
  "",
133
  "## What is in this release",
134
  "",
 
161
  [
162
  "## What data is used here",
163
  "",
164
+ "This release combines public records from these source groups:",
165
  "",
166
  *[f"- {item}" for item in source_groups],
167
  "",
168
+ "## In plain English, what those sources add",
169
+ "",
170
+ "- Disclosure records show trades or financial holdings.",
171
+ "- Bill and vote records show legislative activity in related policy areas.",
172
+ "- Committee records show formal committee context.",
173
+ "- Lobbying and campaign-finance visibility add more public context around the same issue areas.",
174
+ "- Community project funding records and award pages help show recipient-side relationships.",
175
+ "",
176
  "## How those records show up in this release",
177
  "",
178
  "- `members.csv`: one row per House member in this slice.",
 
188
  def _how_to_use_markdown() -> str:
189
  return "\n".join(
190
  [
191
+ "## Best way to use this",
192
  "",
193
  "1. Pick one House member.",
194
+ "2. Start in **Overview** and look at the top sectors or funding recipients for that person.",
195
+ "3. Pick one relationship in **Relationship to explain**.",
196
+ "4. Read the plain-English reasons and the coarse evidence window.",
197
+ "5. If it looks interesting, open the source URLs and SHA-backed artifacts to verify it yourself.",
198
  "",
199
+ "A good rule of thumb: treat this as a lead generator for public-record review, not as a conclusion machine.",
200
  ]
201
  )
202
 
 
926
 
927
  with gr.Blocks(title=copy_payload.get("title", "Congress Public Records Slice")) as app:
928
  gr.Markdown(copy_payload.get("welcome_markdown", copy_payload.get("landing_markdown", "")))
929
+ with gr.Tab("Start Here"):
930
  gr.Markdown(_about_release_markdown(manifest, data["recipient_link_quality"], data["source_quality"]))
931
  gr.Markdown(_data_used_markdown(manifest))
932
  gr.Markdown(_how_to_use_markdown())