Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

gulpfile.js 2.4 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
  1. const fs = require('fs');
  2. const gulp = require('gulp');
  3. const cp = require('child_process');
  4. const miss = require('mississippi');
  5. const Promise = require('bluebird');
  6. const log = require('gulplog');
  7. const args = require('minimist')(process.argv.slice(2));
  8. const olimport = require('./lib/ol-import');
  9. const lkexport = require('./lib/lkexport');
  10. const grimport = require('./lib/goodreads')
  11. const olDate = args['ol-date'] || '2017-10-01';
  12. exports.importAuthors = () => olimport.authors(olDate);
  13. exports.importWorks = () => olimport.works(olDate);
  14. exports.importEditions = () => olimport.editions(olDate);
  15. exports.importOpenLib = gulp.parallel(
  16. exports.importAuthors,
  17. exports.importWorks,
  18. exports.importEditions
  19. );
  20. exports.importOpenLib.description = 'Import all OpenLib data';
  21. exports.importAmazon = function() {
  22. return cp.spawn('psql', ['-c', "\\copy az_raw_ratings FROM 'data/ratings_Books.csv' WITH CSV"], {
  23. stdio: ['ignore', process.stdout, process.stderr]
  24. });
  25. };
  26. exports.importGoodReads = gulp.parallel(
  27. grimport.importAuthors, grimport.importBooks, grimport.importWorks,
  28. grimport.importInteractions
  29. );
  30. exports.importBX = function() {
  31. const bxi = require('./lib/bximport');
  32. return bxi('data/BX-Book-Ratings.csv');
  33. };
  34. exports.importVIAF = function() {
  35. var viaf = require('./lib/viaf-import');
  36. return viaf.import('data/viaf-20180401-clusters-marc21.xml.gz');
  37. };
  38. exports.importLOC = function() {
  39. var loc = require('./lib/loc-import');
  40. return loc.import('data/LOC/BooksAll.*.gz');
  41. };
  42. exports.indexLOC = function() {
  43. return new Promise((ok, fail) => {
  44. let script = fs.createReadStream('loc-index.sql');
  45. script.on('open', () => {
  46. let p = cp.spawn('psql', [], {
  47. stdio: [script, process.stdout, process.stderr]
  48. });
  49. p.on('exit', (code, sig) => {
  50. if (sig) fail(new Error('psql exited with signal ' + sig));
  51. else if (code) fail(new Error('psql exited with code ' + code));
  52. else ok();
  53. });
  54. p.on('error', fail);
  55. });
  56. });
  57. };
  58. exports.export = gulp.series(
  59. function mkdir(cb) {
  60. fs.mkdir('out', (err) => {
  61. if (err && err.code != 'EEXIST') {
  62. cb(err);
  63. } else {
  64. cb();
  65. }
  66. })
  67. },
  68. gulp.parallel(
  69. function amazon() { return lkexport.amazon('out/az-ratings.csv') },
  70. function bxAll() { return lkexport.bxAll('out/bx-implicit.csv') },
  71. function bxExplicit() { return lkexport.bxExplicit('out/bx-ratings.csv') }
  72. ));
Tip!

Press p to see the previous file, or n to see the next file.

Comments

Loading...