# download_webnyheter2013.sh

12345678910111213
  # Copyright (c) 2020 NVIDIA Corporation. All rights reserved.
  #
  # Fetches webbnyheter2013.xml.bz2 from spraakbanken.gu.se and the
  # sb_corpus_reader.py helper from the sb-nltk-tools GitHub repository,
  # places both in ./source_code/, runs get_nyheterdata.py there, and moves
  # webnyheter2013.txt into ./dataset/SV/ (relative to the starting directory).
  #
  # Run from the directory that contains source_code/. The steps are chained
  # with && so the first failing step stops the run and its status becomes the
  # exit status of the script.
  #
  # NOTE(review): webnyheter2013.txt (single "b") is presumably written by
  # get_nyheterdata.py, which is not visible here -- confirm the file name.

  # Create the destination up front so a missing directory cannot fail the
  # final mv after the download and conversion have already been done.
  mkdir -p ./dataset/SV &&
  # -O pins the output name: a rerun overwrites a leftover archive instead of
  # saving the new download as webbnyheter2013.xml.bz2.1 and unpacking the
  # stale copy.
  wget -O webbnyheter2013.xml.bz2 http://spraakbanken.gu.se/lb/resurser/meningsmangder/webbnyheter2013.xml.bz2 &&
  bunzip2 webbnyheter2013.xml.bz2 &&
  mv webbnyheter2013.xml ./source_code/ &&
  wget -O sb_corpus_reader.py https://raw.githubusercontent.com/spraakbanken/sb-nltk-tools/master/sb_corpus_reader.py &&
  mv sb_corpus_reader.py ./source_code/ &&
  cd ./source_code/ &&
  python get_nyheterdata.py &&
  # Show what is now in source_code/ before the result is moved away.
  ls &&
  mv webnyheter2013.txt ../dataset/SV/ &&
  # The decompressed XML is only an intermediate input; drop it once the text
  # file has been moved.
  rm -f webbnyheter2013.xml