Generate artifact-evaluation results.md files for sysartifacts and secartifacts sites.
This is the unified entry point for generating results pages for both sites:
- sysartifacts.github.io (USENIX systems conferences: FAST, OSDI, ATC, NSDI)
- secartifacts.github.io (security conferences: USENIX Security, ACSAC)
The --target flag selects the output format (badge images, Liquid template).
The --conference flag selects which scraper to use.
Usage
sysartifacts: FAST 2025
python -m src.scrapers.generate_results --target sysartifacts --conference fast --years 2025
sysartifacts: OSDI 2024 with custom dir prefix
python -m src.scrapers.generate_results --target sysartifacts --conference osdi --years 2024 --dir-prefix osdi
secartifacts: ACSAC 2025
python -m src.scrapers.generate_results --target secartifacts --conference acsac --years 2025
secartifacts: USENIX Security 2025
python -m src.scrapers.generate_results --target secartifacts --conference usenixsec --years 2025
Preview without writing
python -m src.scrapers.generate_results --target secartifacts --conference acsac --years 2025 --dry-run
Requirements
pip install requests beautifulsoup4 pyyaml lxml
Output: <site-dir>/<conference-dir>/results.md (and organizers.md when available)
scrape_artifacts(config, year, **kwargs)
Dispatch to the appropriate scraper.
Returns list of dicts with: title, badges (list[str]), artifact_urls (list[str]), paper_url (str).
Source code in src/scrapers/generate_results.py
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
def scrape_artifacts(config, year, **kwargs):
    """
    Run the scraper named by ``config["scraper"]`` for one conference year.

    The ``"acsac"`` scraper is called with ``year`` only and its result is
    returned unchanged. Every other scraper name is handed to
    ``usenix_scrape.scrape_conference_year``; papers without badges are
    dropped and the remaining ones are reduced to the common record shape.

    Args:
        config: Mapping; only ``config["scraper"]`` is read here.
        year: Conference year, passed through to the selected scraper.
        **kwargs: Optional ``max_workers`` (default 4) and ``delay``
            (default 0.5). They are forwarded to the USENIX scraper only;
            the ACSAC path ignores them.

    Returns:
        List of dicts with: title, badges (list[str]), artifact_urls
        (list[str]), paper_url (str). ACSAC results are returned exactly as
        the ACSAC scraper produced them (presumably already in this shape).
    """
    scraper_name = config["scraper"]

    # Imports stay inside the branches, so only the selected scraper module
    # is loaded.
    if scraper_name != "acsac":
        # All USENIX conferences (fast, osdi, atc, nsdi, usenixsecurity)
        from .usenix_scrape import scrape_conference_year

        papers = scrape_conference_year(
            scraper_name,
            year,
            max_workers=kwargs.get("max_workers", 4),
            delay=kwargs.get("delay", 0.5),
        )

        # Normalize to the common format, keeping only papers with badges.
        # The USENIX path never fills in artifact_urls.
        return [
            {
                "title": paper["title"],
                "badges": paper["badges"],
                "artifact_urls": [],
                "paper_url": paper.get("paper_url", ""),
            }
            for paper in papers
            if paper.get("badges")
        ]

    from .acsac_scrape import scrape_acsac_artifacts

    return scrape_acsac_artifacts(year)
|
scrape_organizers_for(config, year)
Scrape AE committee organizers if supported for this config.
Source code in src/scrapers/generate_results.py
187
188
189
190
191
192
def scrape_organizers_for(config, year):
    """Scrape AE committee organizers for ``year`` when the config enables it.

    Returns None when ``config`` has no truthy ``"scrape_organizers"`` entry;
    otherwise returns whatever ``usenix_scrape.scrape_organizers`` yields for
    ``config["scraper"]`` and ``year``.
    """
    if config.get("scrape_organizers"):
        # Imported only when actually needed.
        from .usenix_scrape import scrape_organizers

        return scrape_organizers(config["scraper"], year)
    return None
|
generate_results_md(config, year, artifacts)
Generate a results.md string from config + scraped artifacts.
Source code in src/scrapers/generate_results.py
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
def generate_results_md(config, year, artifacts):
    """Build the complete text of a results.md page.

    The page is YAML front matter (title, the config's ``front_matter``
    entries, and one record per artifact), followed by a per-badge summary
    list and the table produced by ``_render_template``.

    Args:
        config: Mapping providing ``badge_columns``, ``badge_labels``,
            ``badges_format``, ``front_matter`` and ``template``; the optional
            ``include_empty_artifact_fields`` flag (default False) adds empty
            ``artifact_url`` / ``appendix_url`` placeholders.
        year: Only passed on to ``_render_template``.
        artifacts: Iterable of dicts with ``title`` and ``badges`` and,
            optionally, ``artifact_urls`` and ``paper_url``.

    Returns:
        The page content as a single string.
    """
    columns = config["badge_columns"]
    labels = config["badge_labels"]
    fmt = config["badges_format"]
    keep_empty = config.get("include_empty_artifact_fields", False)

    # How many artifacts carry each badge, for the summary list.
    totals = {}
    for badge in columns:
        totals[badge] = sum(1 for art in artifacts if badge in art["badges"])

    # One front-matter record per artifact. Key insertion order matters
    # because the YAML dump below does not sort keys.
    records = []
    for art in artifacts:
        record = {"title": art["title"]}
        record["badges"] = _format_badges(art["badges"], fmt)

        urls = art.get("artifact_urls")
        if urls:
            # A single URL uses the singular key; several use the plural one.
            if len(urls) == 1:
                record["artifact_url"] = urls[0]
            else:
                record["artifact_urls"] = urls
        elif keep_empty:
            record["artifact_url"] = ""

        paper_url = art.get("paper_url")
        if paper_url:
            record["paper_url"] = paper_url

        if keep_empty:
            record["appendix_url"] = ""

        records.append(record)

    # Front matter: config entries may override the default title.
    front = {"title": "Results"}
    front.update(config["front_matter"])
    front["artifacts"] = records
    front_yaml = yaml.dump(
        front,
        default_flow_style=False,
        allow_unicode=True,
        sort_keys=False,
        width=120,
    )

    # Summary bullets, in badge-column order.
    bullets = [f"* {totals[badge]} {labels[badge]}" for badge in columns]
    summary = "\n".join(bullets)

    # Results table from the configured template.
    table = _render_template(config["template"], year, columns)

    return f"---\n{front_yaml.rstrip()}\n---\n\n**Evaluation Results**:\n\n{summary}\n\n{table}\n"
|
generate_organizers_md(organizers)
Generate organizers.md from scraped organizer data, or None.
Source code in src/scrapers/generate_results.py
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
def generate_organizers_md(organizers):
    """Generate organizers.md from scraped organizer data, or None.

    Args:
        organizers: Mapping with optional ``"chairs"`` and ``"members"``
            lists (or None). Each person is a dict with a ``"name"`` and an
            optional ``"affiliation"``. A missing key or a ``None`` value for
            either list is treated as an empty list.

    Returns:
        The Markdown page as a string, or None when there is nothing to
        render (no organizers, or neither chairs nor members).
    """
    if not organizers:
        return None

    # ``get(key, [])`` would still hand back None when the key is present with
    # a None value, so normalize explicitly.
    chairs = organizers.get("chairs") or []
    members = organizers.get("members") or []
    if not chairs and not members:
        return None

    def _person(person):
        # Affiliation is optional: tolerate a missing key as well as an
        # empty value.
        affiliation = person.get("affiliation")
        if affiliation:
            return f"{person['name']}, {affiliation}"
        return f"{person['name']}"

    lines = ["---", "title: Organizers", "order: 20", "---", "", "## Artifact Evaluation Committee Co-Chairs", ""]
    # Every chair line ends with " <br>", including the last one.
    for chair in chairs:
        lines.append(f"{_person(chair)} <br>")

    lines.extend(["", "## Artifact Evaluation Committee", ""])
    # Member lines are separated by "<br>"; the final member has no suffix.
    last_index = len(members) - 1
    for index, member in enumerate(members):
        suffix = "<br>" if index < last_index else ""
        lines.append(f"{_person(member)}{suffix}")

    return "\n".join(lines) + "\n"
|