Skip to content

Commit

Permalink
use faster AWS link by DGL
Browse files Browse the repository at this point in the history
  • Loading branch information
weihua916 committed Sep 29, 2021
1 parent 287b56d commit ba5506c
Show file tree
Hide file tree
Showing 4 changed files with 8 additions and 12 deletions.
5 changes: 2 additions & 3 deletions ogb/lsc/pcqm4mv2.py
Original file line number Diff line number Diff line change
Expand Up @@ -30,10 +30,9 @@ def __init__(self, root = 'dataset', smiles2graph = smiles2graph, only_smiles=Fa

# Old url hosted at Stanford
# md5sum: 65b742bafca5670be4497499db7d361b
self.url = f'http://ogb-data.stanford.edu/data/lsc/pcqm4m-v2.zip'
# self.url = f'http://ogb-data.stanford.edu/data/lsc/pcqm4m-v2.zip'
# New url hosted by DGL team at AWS--much faster to download
# (TODO) change the DGL link
# self.url = 'https://dgl-data.s3-accelerate.amazonaws.com/dataset/OGB-LSC/pcqm4m_kddcup2021.zip'
self.url = 'https://dgl-data.s3-accelerate.amazonaws.com/dataset/OGB-LSC/pcqm4m-v2.zip'

# check version and update if necessary
if osp.isdir(self.folder) and (not osp.exists(osp.join(self.folder, f'RELEASE_v{self.version}.txt'))):
Expand Down
5 changes: 2 additions & 3 deletions ogb/lsc/pcqm4mv2_dgl.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,10 +27,9 @@ def __init__(self, root = 'dataset', smiles2graph = smiles2graph):

# Old url hosted at Stanford
# md5sum: 65b742bafca5670be4497499db7d361b
self.url = f'http://ogb-data.stanford.edu/data/lsc/pcqm4m-v2.zip'
# self.url = f'http://ogb-data.stanford.edu/data/lsc/pcqm4m-v2.zip'
# New url hosted by DGL team at AWS--much faster to download
# (TODO) change the DGL link
# self.url = 'https://dgl-data.s3-accelerate.amazonaws.com/dataset/OGB-LSC/pcqm4m_kddcup2021.zip'
self.url = 'https://dgl-data.s3-accelerate.amazonaws.com/dataset/OGB-LSC/pcqm4m-v2.zip'

# check version and update if necessary
if osp.isdir(self.folder) and (not osp.exists(osp.join(self.folder, f'RELEASE_v{self.version}.txt'))):
Expand Down
5 changes: 2 additions & 3 deletions ogb/lsc/pcqm4mv2_pyg.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,10 +28,9 @@ def __init__(self, root = 'dataset', smiles2graph = smiles2graph, transform=None

# Old url hosted at Stanford
# md5sum: 65b742bafca5670be4497499db7d361b
self.url = f'http://ogb-data.stanford.edu/data/lsc/pcqm4m-v2.zip'
# self.url = f'http://ogb-data.stanford.edu/data/lsc/pcqm4m-v2.zip'
# New url hosted by DGL team at AWS--much faster to download
# (TODO) change the DGL link
# self.url = 'https://dgl-data.s3-accelerate.amazonaws.com/dataset/OGB-LSC/pcqm4m_kddcup2021.zip'
self.url = 'https://dgl-data.s3-accelerate.amazonaws.com/dataset/OGB-LSC/pcqm4m-v2.zip'

# check version and update if necessary
if osp.isdir(self.folder) and (not osp.exists(osp.join(self.folder, f'RELEASE_v{self.version}.txt'))):
Expand Down
5 changes: 2 additions & 3 deletions ogb/lsc/wikikg90mv2.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,10 +20,9 @@ def __init__(self, root: str = 'dataset'):

# Old url hosted at Stanford
# md5sum: bfd6257134b7eb59e2edc0a4af21faa8
self.url = 'http://ogb-data.stanford.edu/data/lsc/wikikg90m-v2.zip'
# self.url = 'http://ogb-data.stanford.edu/data/lsc/wikikg90m-v2.zip'
# New url hosted by DGL team at AWS--much faster to download
# (TODO) change the DGL link
# self.url = 'https://dgl-data.s3-accelerate.amazonaws.com/dataset/OGB-LSC/wikikg90m_kddcup2021.zip'
self.url = 'https://dgl-data.s3-accelerate.amazonaws.com/dataset/OGB-LSC/wikikg90m-v2.zip'

self.processed_dir = osp.join(self.folder, 'processed')

Expand Down

0 comments on commit ba5506c

Please sign in to comment.