Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

dvc.jsonnet 1.4 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
  // Stage definitions for the az2018 directory, built with helpers from ../lib.jsonnet.
  // NOTE(review): the cmd/deps/outs/wdir fields look like DVC stage entries that
  // bd.pipeline renders into a pipeline file — confirm against lib.jsonnet.
  local bd = import '../lib.jsonnet';

  // Program sources listed as dependencies by both scan stages.
  local scan_code_deps = [
    '../src/amazon.rs',
    '../src/cli/amazon/',
  ];

  // Alternative ingest stages; exactly one entry is selected below by
  // the value of bd.config.az2018.source ('ratings' or 'reviews').
  local source_stages = {
    // Ingest from the CSV file; writes ratings.parquet only.
    ratings: {
      'scan-ratings': {
        cmd: bd.cmd('amazon scan-ratings -o ratings.parquet --swap-id-columns ../data/az2018/Books.csv'),
        deps: scan_code_deps + ['../data/az2018/Books.csv'],
        outs: ['ratings.parquet'],
      },
    },

    // Ingest from the gzipped JSON file; writes both ratings.parquet and reviews.parquet.
    reviews: {
      'scan-reviews': {
        cmd: bd.cmd('amazon scan-reviews --rating-output ratings.parquet --review-output reviews.parquet ../data/az2018/Books.json.gz'),
        deps: scan_code_deps + ['../data/az2018/Books.json.gz'],
        outs: [
          'ratings.parquet',
          'reviews.parquet',
        ],
      },
    },
  };

  // Stages that are present regardless of which ingest source is configured.
  local cluster_stages = {
    // Declares wdir '..', so every path in this stage is written relative to
    // the parent directory rather than to this one.
    'cluster-ratings': {
      wdir: '..',
      cmd: bd.cmd('amazon cluster-ratings -o az2018/az-cluster-ratings.parquet az2018/ratings.parquet'),
      deps: [
        'src/cli/amazon',
        'az2018/ratings.parquet',
        'book-links/isbn-clusters.parquet',
      ],
      outs: ['az2018/az-cluster-ratings.parquet'],
    },

    // Consumes the cluster-ratings output; paths here are relative to this directory.
    'cluster-ratings-5core': {
      cmd: bd.cmd('kcore -o az-cluster-ratings-5core.parquet az-cluster-ratings.parquet'),
      deps: [
        'az-cluster-ratings.parquet',
        '../src/cli/kcore.rs',
      ],
      outs: ['az-cluster-ratings-5core.parquet'],
    },
  };

  // Merge the configured ingest stage with the clustering stages and hand the
  // result to bd.pipeline together with the az2018 enabled setting.
  bd.pipeline(
    source_stages[bd.config.az2018.source] + cluster_stages,
    bd.config.az2018.enabled
  )
Tip!

Press p or ← to see the previous file, or n or → to see the next file

Comments

Loading...