diff --git a/.gitignore b/.gitignore index bab5ad8be4..3a4cdbeb2b 100644 --- a/.gitignore +++ b/.gitignore @@ -27,4 +27,6 @@ docs/source/generated # IDEs and Python venv .idea .venv -.vscode \ No newline at end of file +.vscode + +dataset/* diff --git a/graphstorm_job.sh b/graphstorm_job.sh old mode 100644 new mode 100755 diff --git a/python/graphstorm/data/ogbn_datasets.py b/python/graphstorm/data/ogbn_datasets.py index f658477bef..1c51a48ea8 100644 --- a/python/graphstorm/data/ogbn_datasets.py +++ b/python/graphstorm/data/ogbn_datasets.py @@ -86,7 +86,7 @@ def __init__(self, raw_dir, dataset, edge_pct=1, self._num_classes = 47 elif dataset == "ogbn-arxiv": self._num_classes = 40 - elif dataset == "ogbn-papers100M": + elif dataset == "ogbn-papers100M" or dataset == "ogbn-papers100m": self._num_classes = 172 self.retain_original_features = retain_original_features self.lm_model_name=lm_model_name diff --git a/tools/partition_graph.py b/tools/partition_graph.py index 132c73a894..d31da5a808 100644 --- a/tools/partition_graph.py +++ b/tools/partition_graph.py @@ -121,7 +121,8 @@ retain_original_features=args.retain_original_features, max_sequence_length=args.max_seq_length, lm_model_name=args.lm_model_name) - elif args.dataset == 'ogbn-papers100m': + elif args.dataset == 'ogbn-papers100M' or args.dataset == 'ogbn-papers100m': + args.dataset = 'ogbn-papers100M' dataset = OGBTextFeatDataset(args.filepath, dataset=args.dataset, retain_original_features=args.retain_original_features, max_sequence_length=args.max_seq_length,