Update data/download_wudao.sh

This commit is contained in:
Namhyeon Go 2024-06-14 09:08:03 +00:00
parent 0157b6938d
commit 5635f7d08d

View File

@@ -9,6 +9,7 @@
# download wudao dataset and preprocess
# Copyright (c) 2023 by s-JoL(sl12160010@gmail.com), All Rights Reserved.
###
# Install `unrar` (presumably needed later to unpack the downloaded .rar
# archive -- the extraction step is not visible here) and fetch the corpus.
#
# Enable the "multiverse" component before installing `unrar`.
# -y answers the confirmation prompt so the script can run unattended.
apt-add-repository -y multiverse
# Refresh the package lists so the newly enabled component is visible.
apt-get update
# apt-get (rather than apt) is the interface intended for scripts;
# -y skips the interactive "Do you want to continue?" prompt.
apt-get install -y unrar
# wget -O does not create missing parent directories, so make sure the
# target directory exists relative to the current working directory.
mkdir -p data
# -c resumes a partially downloaded file; -v keeps verbose progress output.
wget -v -c 'https://download.scidb.cn/download?fileId=63a30383fed6a8a9e8454302&dataSetType=organization&fileName=WuDaoCorporaText-2.0-open.rar' -O data/WuDaoCorpus2.0_base_200G.rar