mirror of
https://github.com/openai/gpt-2-output-dataset
synced 2025-08-22 09:58:07 +00:00
move to azure
This commit is contained in:
parent
ddfecb3932
commit
d6f4e2956b
@@ -17,7 +17,7 @@ for ds in [
|
|||||||
]:
|
]:
|
||||||
for split in ['train', 'valid', 'test']:
|
for split in ['train', 'valid', 'test']:
|
||||||
filename = ds + "." + split + '.jsonl'
|
filename = ds + "." + split + '.jsonl'
|
||||||
r = requests.get("https://storage.googleapis.com/gpt-2/output-dataset/v1/" + filename, stream=True)
|
r = requests.get("https://openaipublic.blob.core.windows.net/gpt-2/output-dataset/v1/" + filename, stream=True)
|
||||||
|
|
||||||
with open(os.path.join(subdir, filename), 'wb') as f:
|
with open(os.path.join(subdir, filename), 'wb') as f:
|
||||||
file_size = int(r.headers["content-length"])
|
file_size = int(r.headers["content-length"])
|
||||||
|
Loading…
x
Reference in New Issue
Block a user