Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

dvc.yaml 1.7 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
  # DVC pipeline definition. Each entry under `stages` declares a command,
  # the files it depends on, and the files it produces.
  # Relative paths are written as they appear in the stage commands.
  stages:
    # Runs the `openlib scan-authors` command over the authors dump.
    scan-authors:
      cmd: python ../run.py --rust openlib scan-authors ../data/openlib/ol_dump_authors.txt.gz
      deps:
        - ../src/cli/openlib.rs
        - ../src/openlib/
        - ../data/openlib/ol_dump_authors.txt.gz
      outs:
        - authors.parquet
        - author-names.parquet

    # Runs the `openlib scan-works` command over the works dump.
    # Depends on authors.parquet, so it is ordered after scan-authors.
    scan-works:
      cmd: python ../run.py --rust openlib scan-works ../data/openlib/ol_dump_works.txt.gz
      deps:
        - ../src/cli/openlib.rs
        - ../src/openlib/
        - ../data/openlib/ol_dump_works.txt.gz
        - authors.parquet
      outs:
        - works.parquet
        - work-authors.parquet
        - author-ids-after-works.parquet

    # Runs the `openlib scan-editions` command over the editions dump.
    # Depends on outputs of both scan-authors and scan-works.
    scan-editions:
      cmd: python ../run.py --rust openlib scan-editions ../data/openlib/ol_dump_editions.txt.gz
      deps:
        - ../src/cli/openlib.rs
        - ../src/openlib/
        - ../data/openlib/ol_dump_editions.txt.gz
        - authors.parquet
        - works.parquet
        - author-ids-after-works.parquet
      outs:
        - editions.parquet
        - edition-works.parquet
        - edition-isbns.parquet
        - edition-authors.parquet
        - all-works.parquet
        - all-authors.parquet

    # Runs the `fusion` command with the edition-isbn-ids.tcl script.
    # Inputs are the edition ISBN table from scan-editions and the
    # all-isbns table from the sibling book-links directory.
    edition-isbn-ids:
      cmd: python ../run.py --rust fusion edition-isbn-ids.tcl
      deps:
        - edition-isbn-ids.tcl
        - edition-isbns.parquet
        - ../book-links/all-isbns.parquet
      outs:
        - edition-isbn-ids.parquet

    # Templated stage: DVC expands `do` once per `foreach` entry, substituting
    # ${item}. Each expansion runs `pq-info` on <item>.parquet and writes
    # <item>.json.
    # NOTE(review): author-ids-after-works.parquet is produced by scan-works but
    # is not listed here — presumably intentional; confirm.
    schema:
      foreach:
        - authors
        - author-names
        - works
        - work-authors
        - editions
        - edition-works
        - edition-isbns
        - edition-authors
        - all-works
        - all-authors
        - edition-isbn-ids
      do:
        cmd: python ../run.py --rust pq-info -o ${item}.json ${item}.parquet
        deps:
          - ${item}.parquet
        outs:
          # `cache: false` keeps the JSON output out of the DVC cache.
          - ${item}.json:
              cache: false
Tip!

Press p or ← to see the previous file, or n or → to see the next file

Comments

Loading...