Skip to content

Commit fcfe25b

Browse files
J03D03 and claude committed
Split load and transform steps in examples for readability
Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
1 parent e1b70ea commit fcfe25b

3 files changed

Lines changed: 7 additions & 3 deletions

File tree

‎examples/04_enrich_with_commit_data.py‎

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,5 +9,6 @@
99

1010
if __name__ == "__main__":
1111
# Devign contains only 2 projects (FFmpeg, QEMU).
12-
entries = transformations.add_commit_information_local(vfc_datasets.DevignDataset())
12+
entries = vfc_datasets.DevignDataset()
13+
entries = transformations.add_commit_information_local(entries)
1314
log_dataset_stats(entries)

‎examples/06_create_splits.py‎

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,8 +9,10 @@
99
setup_logging("create_splits")
1010

1111
if __name__ == "__main__":
12+
entries = vfc_datasets.DevignDataset()
13+
1214
create_random_split(
13-
vfc_datasets.DevignDataset(),
15+
entries,
1416
name="devign",
1517
output_path=Path(".data/splits"),
1618
seed=42,

‎examples/07_filter_by_language.py‎

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,8 @@
1010
logger = logging.getLogger(__name__)
1111

1212
if __name__ == "__main__":
13-
entries = transformations.add_commit_information_local(vfc_datasets.DevignDataset())
13+
entries = vfc_datasets.DevignDataset()
14+
entries = transformations.add_commit_information_local(entries)
1415

1516
logger.info("Entries before filtering: %d", len(entries))
1617
entries = transformations.filter_by_extension(entries, {"c", "h", "cpp", "hpp", "cc"})

0 commit comments

Comments (0)