Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

dvc.yaml 4.9 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
# dvc project pipeline
# NOTE: see scripts/README.MD for preprocessing from raw data up to the first
# tracked stage `createtiles`
stages:
  # Retile each year's raw GeoTIFF (data/raw/ortho_ms_<year>_EPSG3044.tif)
  # into tiles of ${source_dim} x ${source_dim} pixels with gdal_retile.py.
  # `foreach` expands this into one stage instance per listed year; ${item}
  # is the current year. `source_dim` is tracked as a parameter.
  createtiles:
    foreach: [2017, 2018, 2019, 2020]
    do:
      # The two commands are chained with `&&` (not `;`) so that a failed
      # mkdir aborts the stage instead of letting gdal_retile.py run against
      # a missing target directory.
      # -csv writes the tile index as locations.csv; -ps sets the tile size.
      cmd: >-
        mkdir -p data/processed.images.${item} &&
        gdal_retile.py
        -csv locations.csv
        -v -ps ${source_dim} ${source_dim}
        -co "TILED=YES" -co "COMPRESS=LZW" -co "PREDICTOR=2"
        -co "ALPHA=NO" -co "NUM_THREADS=ALL_CPUS"
        -targetDir data/processed.images.${item}
        data/raw/ortho_ms_${item}_EPSG3044.tif
      deps:
        - data/raw/ortho_ms_${item}_EPSG3044.tif
      params:
        - source_dim
      outs:
        - data/processed.images.${item}
  # Run scripts/computestats.py (with --frac 0.1) over the tile directories
  # of all four years and track the resulting
  # data/processed.images.stats.json as the stage output.
  computestats:
    cmd: >-
      python scripts/computestats.py
      --frac 0.1
      data/processed.images.2017 data/processed.images.2018
      data/processed.images.2019 data/processed.images.2020
    deps:
      - data/processed.images.2017
      - data/processed.images.2018
      - data/processed.images.2019
      - data/processed.images.2020
    outs:
      - data/processed.images.stats.json
  # Per year: call scripts/createmasks.py with the tile directory, the mask
  # directory and that year's deadtrees shapefile. The tile directory and
  # shapefile folder are dependencies; the mask directory is the output.
  createmasks:
    foreach: [2017, 2018, 2019, 2020]
    do:
      cmd: >-
        python scripts/createmasks.py
        data/processed.images.${item} data/processed.masks.${item}
        data/raw/shapefiles/deadtrees_${item}/deadtrees_${item}.shp
      deps:
        - data/processed.images.${item}
        # the whole shapefile folder is tracked, not just the .shp file
        - data/raw/shapefiles/deadtrees_${item}
      outs:
        - data/processed.masks.${item}
  # Per year: call scripts/createmasks.py with --simple on the tile directory
  # and the CORINE_forest.shp shapefile, writing to data/processed.lus.<year>.
  # The same shapefile is used for every year.
  createforestmasks:
    foreach: [2017, 2018, 2019, 2020]
    do:
      cmd: >-
        python scripts/createmasks.py
        data/processed.images.${item} data/processed.lus.${item}
        data/raw/shapefiles/forestmask/CORINE_forest.shp
        --simple
      deps:
        - data/processed.images.${item}
        - data/raw/shapefiles/forestmask/CORINE_forest.shp
      outs:
        - data/processed.lus.${item}
  # Per year: call scripts/createdataset.py on the image, mask and lus
  # directories and write into data/dataset. The tracked outputs are the
  # train_<year> subdirectory and the stats_<year>.csv file.
  # source_dim, createdataset.tile_size and file_type are tracked parameters
  # and are interpolated into the command line.
  createdataset:
    foreach: [2017, 2018, 2019, 2020]
    do:
      cmd: >-
        python scripts/createdataset.py
        data/processed.images.${item} data/processed.masks.${item}
        data/processed.lus.${item} data/dataset
        --subdir train_${item}
        --source_dim ${source_dim} --tile_size ${createdataset.tile_size}
        --format ${file_type}
        --stats stats_${item}.csv
      deps:
        - data/processed.images.${item}
        - data/processed.masks.${item}
        - data/processed.lus.${item}
      params:
        - source_dim
        - createdataset.tile_size
        - file_type
      outs:
        - data/dataset/train_${item}
        - data/dataset/stats_${item}.csv
  # Only the 2017 and 2019 datasets are merged into the train/val/test
  # splits; 2018 and 2020 are test only.
  mergedatasets:
    cmd: >-
      python scripts/mergedatasets.py
      data/dataset/train_2017 data/dataset/train_2019
    deps:
      - data/dataset/train_2017
      - data/dataset/train_2019
    outs:
      - data/dataset/train
      - data/dataset/val
      - data/dataset/test
  # train: not a pipeline stage - do this manually
  #
  # inference
  # Per year: run scripts/inference.py on the tile directory with the three
  # checkpoints below (one -m argument each), then combine the predicted
  # tiles into a single GeoTIFF with gdal_merge.py.
  # overlap values possible: 32px or 128px
  inference:
    foreach: [2017, 2018, 2019, 2020]
    do:
      # The steps are chained with `&&` (not `;`): with `;` a failing
      # inference run would still be followed by gdal_merge.py, whose exit
      # status would then decide whether the stage counts as successful.
      # stdbuf -i0 -o0 -e0 runs the script with unbuffered stdin/stdout/stderr.
      cmd: >-
        mkdir -p data/predicted.${item} &&
        stdbuf -i0 -o0 -e0
        python scripts/inference.py --all --overlap 32
        -o data/predicted.${item} data/processed.images.${item}
        -m checkpoints/earnest-dew-216_epoch_235.ckpt
        -m checkpoints/fine-lake-207_epoch_279.ckpt
        -m checkpoints/sage-glitter-214_epoch_106.ckpt &&
        gdal_merge.py
        -co "TILED=YES" -co "COMPRESS=LZW" -co "PREDICTOR=2"
        -co "NUM_THREADS=ALL_CPUS"
        -o data/predicted_mosaic_${item}.tif
        data/predicted.${item}/ortho_ms_${item}_EPSG3044_*
      deps:
        - data/processed.images.${item}
        - checkpoints/earnest-dew-216_epoch_235.ckpt
        - checkpoints/fine-lake-207_epoch_279.ckpt
        - checkpoints/sage-glitter-214_epoch_106.ckpt
      outs:
        - data/predicted.${item}
        - data/predicted_mosaic_${item}.tif
  # Run scripts/computestats_inference.py over the prediction directories of
  # all four years and track data/predicted.stats.csv as the stage output.
  computestatsinference:
    cmd: >-
      python scripts/computestats_inference.py
      data/predicted.2017 data/predicted.2018
      data/predicted.2019 data/predicted.2020
    deps:
      - data/predicted.2017
      - data/predicted.2018
      - data/predicted.2019
      - data/predicted.2020
    outs:
      - data/predicted.stats.csv
  # Run scripts/aggregate_results.py on the four data/processed.lus.<year>
  # directories; the tracked output is the data/maps directory.
  computeaggregatemaps:
    # `mkdir -p` matches the other stages and does not fail when data/maps
    # is already present; `&&` (not `;`) stops the stage if the directory
    # cannot be created.
    cmd: >-
      mkdir -p data/maps &&
      python scripts/aggregate_results.py
      data/processed.lus.2017
      data/processed.lus.2018
      data/processed.lus.2019
      data/processed.lus.2020
    deps:
      # NOTE(review): the data/predicted.* directories are declared as
      # dependencies but are not passed on the command line - presumably the
      # script locates them itself; confirm against aggregate_results.py.
      - data/predicted.2017
      - data/predicted.2018
      - data/predicted.2019
      - data/predicted.2020
      - data/processed.lus.2017
      - data/processed.lus.2018
      - data/processed.lus.2019
      - data/processed.lus.2020
    outs:
      - data/maps
Tip!

Press p or ← to see the previous file, or n or → to see the next file

Comments

Loading...