1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
|
local bd = import '../lib.jsonnet';

// Source paths that every scan stage lists as its first two dependencies.
local scanSources = [
  '../src/cli/goodreads',
  '../src/goodreads',
];

// Build one scan stage.
//   kind:      word placed after `goodreads scan` on the command line
//   input:     input file path; given on the command line and listed as a dep
//   outs:      output files of the stage
//   extraDeps: further deps, appended after the input file (default: none)
// The command string is passed through bd.cmd, which is defined in
// ../lib.jsonnet (its behavior is not visible from this file).
local scanStage(kind, input, outs, extraDeps=[]) = {
  cmd: bd.cmd('goodreads scan ' + kind + ' ' + input),
  deps: scanSources + [input] + extraDeps,
  outs: outs,
};

// Stages that are always present.
local baseStages = {
  'scan-book-info': scanStage(
    'books',
    '../data/goodreads/goodreads_books.json.gz',
    [
      'gr-book-ids.parquet',
      'gr-book-info.parquet',
      'gr-book-authors.parquet',
      'gr-book-series.parquet',
    ]
  ),
  'scan-work-info': scanStage(
    'works',
    '../data/goodreads/goodreads_book_works.json.gz',
    ['gr-work-info.parquet']
  ),
  'scan-book-genres': scanStage(
    'genres',
    '../data/goodreads/goodreads_book_genres_initial.json.gz',
    [
      'gr-book-genres.parquet',
      'gr-genres.parquet',
    ]
  ),
  'scan-author-info': scanStage(
    'authors',
    '../data/goodreads/goodreads_book_authors.json.gz',
    ['gr-author-info.parquet']
  ),
  'scan-interactions': scanStage(
    'interactions',
    '../data/goodreads/goodreads_interactions.json.gz',
    [
      'gr-interactions.parquet',
      'gr-users.parquet',
    ]
  ),
};

// The review scan is only included when bd.config.goodreads.reviews is true.
// Besides its input file it also depends on two parquet files.
local reviewStages =
  if bd.config.goodreads.reviews then {
    'scan-reviews': scanStage(
      'reviews',
      '../data/goodreads/goodreads_reviews_dedup.json.gz',
      ['gr-reviews.parquet'],
      extraDeps=[
        'gr-book-link.parquet',
        'gr-users.parquet',
      ]
    ),
  } else {};

baseStages + reviewStages
|