项目作者: nodef

项目描述 :
Crawl Wikipedia pages and upload TTS to Youtube.
高级语言: JavaScript
项目地址: git://github.com/nodef/wikipedia-tts.git
创建时间: 2018-10-05T05:54:49Z
项目社区:https://github.com/nodef/wikipedia-tts

开源协议:MIT License

下载


Crawl Wikipedia pages and upload TTS to YouTube.

Do you want to:

setup

  1. Install Node.js, if not installed.
  2. Run npm install -g wikipedia-tts in console.
  3. To install this as a package use npm install wikipedia-tts.
  4. Follow setup at extra-googletts.
  5. Follow setup at extra-youtubeuploader.

console

  1. wikipedia-tts <command> [page] [options]
  2. # --help: show this help
  3. # -l, --log: enable log
  4. # -o, --output: set output file
  5. # -d, --db: set crawl database file (crawl.db)
  6. # -p, --priority: set page priority (0)
  7. # -r, --references: set page references (0)
  8. # -s, --status: set page status (0)
  9. # -t, --times: times to crawl/upload (1)
  10. # Environment variables:
  11. # WIKIPEDIATTS_LOG: enable logging (0)
  12. # WIKIPEDIATTS_DB: crawl database file (crawl.db)
  13. wikipedia-tts "Ladakh"
  14. # "Ladakh" is uploaded to YouTube
  15. wikipedia-tts add "Plant nutrition"
  16. # "Plant nutrition" is added to crawl list
  17. wikipedia-tts update "Plant nutrition" --priority 1
  18. # "Plant nutrition" priority is set to 1
  19. # this means it will be crawled/uploaded first
  20. # even if other pages have higher number of references
  21. wikipedia-tts crawl
  22. # "Plant nutrition" is page links are crawled
  23. # this is because it is on top priority, references
  24. wikipedia-tts crawl --times 10
  25. # Crawling done recursively 10 times
  26. wikipedia-tts upload
  27. # Highest ranking page is crawled and uploaded to YouTube
  28. wikipedia-tts upload --times 10
  29. # Uploading done recursively 10 times

package

  1. const wikipediaTts = require('wikipedia-tts');
  2. // wikipediaTts.setup([db path]): db conn (promise)
  3. // wikipediaTts.get<db>, <page>): {title, priority, references, status} (promise)
  4. // wikipediaTts.add(<db>, <page>): page (promise)
  5. // wikipediaTts.remove(<db>, <page>): page (promise)
  6. // wikipediaTts.update(<db>, <page>, [value]): page (promise)
  7. // wikipediaTts.crawl(<db>, [options]): times crawled (promise)
  8. // wikipediaTts.upload(<db>, [options]): times uploaded (promise)
  9. // wikipediaTts(<output>, <page>, [options]): Upload page to YouTube
  10. // -> <wikijs page> (promise)
  11. /* More options: @wikipedia-tts/youtube */
  12. // [options]: {
  13. // db: $WIKIPEDIATTS_DB||'crawl.db',
  14. // input: {
  15. // text: null,
  16. // image: null,
  17. // tags: null,
  18. // description: null
  19. // }
  20. // }
  21. wikipediaTts(null, 'Ladakh');
  22. // "Ladakh" is uploaded to youtube
  23. var db = await wikipediaTts.setup();
  24. // crawl list is created (crawl.db)
  25. await wikipediaTts.add(db, 'Plant nutrition');
  26. // "Plant nutrition" is added to crawl list
  27. await wikipediaTts.update(db, 'Plant nutrition', {priority: 1});
  28. // "Plant nutrition" priority is set to 1
  29. // this means it will be crawled/uploaded first
  30. // even if other pages have higher number of references
  31. await wikipediaTts.crawl(db);
  32. // "Plant nutrition" is page links are crawled
  33. // this is because it is on top priority, references
  34. await wikipediaTts.crawl(db, {times: 10});
  35. // Crawling done recursively 10 times
  36. await wikipediaTts.upload(db);
  37. // Highest ranking page is crawled and uploaded to YouTube
  38. await wikipediaTts.crawl(db, {times: 10});
  39. // Uploading done recursively 10 times

wikipedia-tts