Skip to content

Commit b1ac936

Browse files
Created windows_download_dataset.sh; removed the earlier Windows additions from download_dataset.sh
1 parent 18ff1a7 commit b1ac936

File tree

2 files changed

+35
-37
lines changed

2 files changed

+35
-37
lines changed
Lines changed: 0 additions & 37 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,3 @@
1-
# MacOS 系统下载方式
21
#!/bin/bash
32

43
# 设置环境变量
@@ -19,39 +18,3 @@ huggingface-cli download \
1918
--resume-download \
2019
BelleGroup/train_3.5M_CN \
2120
--local-dir "${dataset_dir}/BelleGroup"
22-
23-
# Windows下载方式
24-
# 使用PowerShell下载
25-
# 仅为当前 PowerShell 会话临时设置环境变量,关闭 PowerShell 窗口后自动失效
26-
$env:HF_ENDPOINT = "https://hf-mirror.com"
27-
28-
# 将 \path\to\your\dataset 替换为数据集的下载目录路径
29-
$dataset_dir = "\path\to\your\dataset"
30-
31-
# 需要预先安装modelscope,使用pip install modelscope安装
32-
modelscope download --dataset ddzhu123/seq-monkey mobvoi_seq_monkey_general_open_corpus.jsonl.tar.bz2 --local_dir "$dataset_dir"
33-
34-
tar -xvf "$dataset_dir\mobvoi_seq_monkey_general_open_corpus.jsonl.tar.bz2" -C "$dataset_dir"
35-
36-
huggingface-cli download `
37-
--repo-type dataset `
38-
--resume-download `
39-
BelleGroup/train_3.5M_CN `
40-
--local-dir "$dataset_dir\BelleGroup"
41-
42-
# 使用CMD下载
43-
# 仅为当前 CMD 会话临时设置环境变量,关闭 CMD 窗口后自动失效
44-
set HF_ENDPOINT=https://hf-mirror.com
45-
46-
# 将 \path\to\your\dataset 替换为数据集的下载目录路径
47-
set dataset_dir=\path\to\your\dataset
48-
49-
modelscope download --dataset ddzhu123/seq-monkey mobvoi_seq_monkey_general_open_corpus.jsonl.tar.bz2 --local_dir %dataset_dir%
50-
51-
tar -xvf "%dataset_dir%\mobvoi_seq_monkey_general_open_corpus.jsonl.tar.bz2" -C "%dataset_dir%"
52-
53-
huggingface-cli download ^
54-
--repo-type dataset ^
55-
--resume-download ^
56-
BelleGroup/train_3.5M_CN ^
57-
--local-dir "%dataset_dir%\BelleGroup"
Lines changed: 35 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,35 @@
1+
# Windows下载方式
2+
# 使用PowerShell下载
3+
# 仅为当前 PowerShell 会话临时设置环境变量,关闭 PowerShell 窗口后自动失效
4+
$env:HF_ENDPOINT = "https://hf-mirror.com"
5+
6+
# 将 \path\to\your\dataset 替换为数据集的下载目录路径
7+
$dataset_dir = "\path\to\your\dataset"
8+
9+
# 需要预先安装modelscope,使用pip install modelscope安装
10+
modelscope download --dataset ddzhu123/seq-monkey mobvoi_seq_monkey_general_open_corpus.jsonl.tar.bz2 --local_dir "$dataset_dir"
11+
12+
tar -xvf "$dataset_dir\mobvoi_seq_monkey_general_open_corpus.jsonl.tar.bz2" -C "$dataset_dir"
13+
14+
huggingface-cli download `
15+
--repo-type dataset `
16+
--resume-download `
17+
BelleGroup/train_3.5M_CN `
18+
--local-dir "$dataset_dir\BelleGroup"
19+
20+
# 使用CMD下载
21+
# 暂时为当前CMD界面设置环境,关闭CMD环境自动消失
22+
set HF_ENDPOINT=https://hf-mirror.com
23+
24+
# 将 \path\to\your\dataset 替换为数据集的下载目录路径
25+
set dataset_dir=\path\to\your\dataset
26+
27+
modelscope download --dataset ddzhu123/seq-monkey mobvoi_seq_monkey_general_open_corpus.jsonl.tar.bz2 --local_dir %dataset_dir%
28+
29+
tar -xvf "%dataset_dir%\mobvoi_seq_monkey_general_open_corpus.jsonl.tar.bz2" -C "%dataset_dir%"
30+
31+
huggingface-cli download ^
32+
--repo-type dataset ^
33+
--resume-download ^
34+
BelleGroup/train_3.5M_CN ^
35+
--local-dir "%dataset_dir%\BelleGroup"

0 commit comments

Comments
 (0)