Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

dvc.yaml 4.0 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
  1. # dvc project pipeline
  2. # NOTE: see scripts/README.MD for preprocessing from raw data up to the first
  3. # tracked stage `createtiles`
  4. stages:
  # Cut each yearly orthophoto into tiles with gdal_retile.py.
  # One stage instance is generated per `foreach` entry; `${item}` is the year
  # and `${source_dim}` (tracked parameter) is passed twice to `-ps`.
  createtiles:
    foreach: [2017, 2018, 2019, 2020]
    do:
      # Folded scalar: the lines below are joined with single spaces into one
      # shell command line, so they must all keep the same indentation.
      cmd: >-
        mkdir -p data/processed.images.${item};
        gdal_retile.py -csv locations.csv
        -v -ps ${source_dim} ${source_dim}
        -co "TILED=YES" -co "COMPRESS=LZW" -co "PREDICTOR=2"
        -co "ALPHA=NO" -co "NUM_THREADS=ALL_CPUS"
        -targetDir data/processed.images.${item}
        data/raw/ortho_ms_${item}_EPSG3044.tif
      deps:
        - data/raw/ortho_ms_${item}_EPSG3044.tif
      params:
        - source_dim
      outs:
        - data/processed.images.${item}
  # Run scripts/computestats.py once over the tile directories of all four
  # years (`--frac 0.1` is forwarded to the script unchanged). The declared
  # output is a single JSON file.
  computestats:
    cmd: >-
      python scripts/computestats.py --frac 0.1
      data/processed.images.2017 data/processed.images.2018
      data/processed.images.2019 data/processed.images.2020
    deps:
      - data/processed.images.2017
      - data/processed.images.2018
      - data/processed.images.2019
      - data/processed.images.2020
    outs:
      - data/processed.images.stats.json
  # Run scripts/createmasks.py on a year's image tiles together with that
  # year's `deadtrees` shapefile; the result goes to data/processed.masks.<year>.
  # Only 2017 and 2019 are listed here.
  createmasks:
    foreach: [2017, 2019]
    do:
      cmd: >-
        python scripts/createmasks.py
        data/processed.images.${item} data/processed.masks.${item}
        data/raw/shapefiles/deadtrees_${item}/deadtrees_${item}.shp
      deps:
        - data/processed.images.${item}
        # The whole shapefile directory is tracked, not just the .shp file.
        - data/raw/shapefiles/deadtrees_${item}
      outs:
        - data/processed.masks.${item}
  # Same script as `createmasks`, but fed the CORINE forest shapefile and the
  # `--simple` flag; the result goes to data/processed.lus.<year>.
  createforestmasks:
    foreach: [2017, 2019]
    do:
      cmd: >-
        python scripts/createmasks.py
        data/processed.images.${item} data/processed.lus.${item}
        data/raw/shapefiles/forestmask/CORINE_forest.shp
        --simple
      deps:
        - data/processed.images.${item}
        # NOTE(review): only the .shp file is tracked here, whereas
        # `createmasks` tracks the whole shapefile directory - confirm that
        # changes to the sidecar files do not need to trigger a rerun.
        - data/raw/shapefiles/forestmask/CORINE_forest.shp
      outs:
        - data/processed.lus.${item}
  # Build the per-year training subset under data/dataset/train_<year> from
  # the image tiles, the masks and the `lus` tiles of that year.
  # `source_dim`, `createdataset.tile_size` and `file_type` are tracked
  # parameters that are interpolated into the command line.
  createdataset:
    foreach: [2017, 2019]
    do:
      cmd: >-
        python scripts/createdataset.py
        data/processed.images.${item}
        data/processed.masks.${item}
        data/processed.lus.${item}
        data/dataset
        --subdir train_${item}
        --source_dim ${source_dim}
        --tile_size ${createdataset.tile_size}
        --format ${file_type}
        --stats stats_${item}.csv
      deps:
        - data/processed.images.${item}
        - data/processed.masks.${item}
        - data/processed.lus.${item}
      params:
        - source_dim
        - createdataset.tile_size
        - file_type
      outs:
        - data/dataset/train_${item}
        # NOTE(review): the command passes a bare `stats_<year>.csv`; presumably
        # the script writes it below data/dataset - confirm against the script.
        - data/dataset/stats_${item}.csv
  # Combine the 2017 and 2019 training subsets. The stage declares
  # data/dataset/{train,val,test} as outputs (presumably the script performs
  # the split - confirm in scripts/mergedatasets.py).
  mergedatasets:
    cmd: >-
      python scripts/mergedatasets.py
      data/dataset/train_2017 data/dataset/train_2019
    deps:
      - data/dataset/train_2017
      - data/dataset/train_2019
    outs:
      - data/dataset/train
      - data/dataset/val
      - data/dataset/test
  # train: do this manually (training is not a tracked stage; the inference
  # stage below depends on the resulting checkpoints/bestmodel.ckpt)

  # inference
  # For each year: run scripts/inference.py on the image tiles, then merge the
  # predicted tiles into a single mosaic with gdal_merge.py.
  inference:
    foreach:
      - 2017
      - 2018
      - 2019
      - 2020
    do:
      # The three steps are chained with `&&` rather than `;` so the stage
      # fails as soon as one step fails. With `;` the exit status of the
      # command is that of the final gdal_merge.py alone, so a failed
      # inference run could still be recorded as a successful stage.
      # Folded scalar: all lines are joined with single spaces and must keep
      # the same indentation.
      cmd: >-
        mkdir -p data/predicted.${item} &&
        stdbuf -i0 -o0 -e0 python scripts/inference.py --all --nopreview
        -o data/predicted.${item} data/processed.images.${item} &&
        gdal_merge.py
        -co "TILED=YES" -co "COMPRESS=LZW" -co "PREDICTOR=2" -co "NUM_THREADS=ALL_CPUS"
        -o data/predicted_mosaic_${item}.tif
        data/predicted.${item}/ortho_ms_${item}_EPSG3044_*
      deps:
        - data/processed.images.${item}
        - checkpoints/bestmodel.ckpt
      outs:
        - data/predicted.${item}
        - data/predicted_mosaic_${item}.tif
  # Run scripts/computestats_inference.py once over the prediction directories
  # of all four years. The declared output is a single CSV file.
  computestatsinference:
    cmd: >-
      python scripts/computestats_inference.py
      data/predicted.2017 data/predicted.2018
      data/predicted.2019 data/predicted.2020
    deps:
      - data/predicted.2017
      - data/predicted.2018
      - data/predicted.2019
      - data/predicted.2020
    outs:
      - data/predicted.stats.csv
Tip!

Press p or ← to see the previous file, or n or → to see the next file

Comments

Loading...