Register
Login
Resources
Docs Blog Datasets Glossary Case Studies Tutorials & Webinars
Product
Data Engine LLMs Platform Enterprise
Pricing Explore
Connect to our Discord channel

dvc.yaml 4.1 KB

You have to be logged in to leave a comment. Sign In
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
  1. # dvc project pipeline
  2. # NOTE: see scripts/README.MD for preprocessing from raw data up to the first
  3. # tracked stage `createtiles`
  4. stages:
  # Retile each year's raw GeoTIFF (data/raw/ortho_ms_<year>_EPSG3044.tif) into
  # data/processed.images.<year> with gdal_retile.py. Tile width and height are
  # both taken from the `source_dim` parameter (-ps).
  createtiles:
    foreach: [2017, 2018, 2019, 2020]
    do:
      # The commands are chained with `&&` so that a failing `mkdir` aborts the
      # stage instead of letting gdal_retile.py run regardless.
      # The folded scalar (>-) joins all lines below into one shell command.
      cmd: >-
        mkdir -p data/processed.images.${item} &&
        gdal_retile.py
        -csv locations.csv
        -v -ps ${source_dim} ${source_dim}
        -co "TILED=YES" -co "COMPRESS=LZW" -co "PREDICTOR=2"
        -co "ALPHA=NO" -co "NUM_THREADS=ALL_CPUS"
        -targetDir data/processed.images.${item}
        data/raw/ortho_ms_${item}_EPSG3044.tif
      deps:
        - data/raw/ortho_ms_${item}_EPSG3044.tif
      params:
        - source_dim
      outs:
        - data/processed.images.${item}
  # Run scripts/computestats.py (with --frac 0.1) over the image tiles of all
  # four years.
  # NOTE(review): the declared output path is not passed on the command line;
  # presumably it is the script's default - confirm against the script.
  computestats:
    cmd: >-
      python scripts/computestats.py --frac 0.1
      data/processed.images.2017 data/processed.images.2018
      data/processed.images.2019 data/processed.images.2020
    deps:
      - data/processed.images.2017
      - data/processed.images.2018
      - data/processed.images.2019
      - data/processed.images.2020
    outs:
      - data/processed.images.stats.json
  # Per year: run scripts/createmasks.py on the image tiles together with that
  # year's deadtrees shapefile, writing to data/processed.masks.<year>.
  createmasks:
    foreach: [2017, 2018, 2019, 2020]
    do:
      # Positional arguments: image tile dir, output mask dir, shapefile.
      cmd: >-
        python scripts/createmasks.py
        data/processed.images.${item} data/processed.masks.${item}
        data/raw/shapefiles/deadtrees_${item}/deadtrees_${item}.shp
      deps:
        - data/processed.images.${item}
        # The whole shapefile directory is tracked, not just the .shp file.
        - data/raw/shapefiles/deadtrees_${item}
      outs:
        - data/processed.masks.${item}
  # Per year: run scripts/createmasks.py with --simple on the image tiles and
  # the CORINE forest shapefile, writing to data/processed.lus.<year>.
  createforestmasks:
    foreach: [2017, 2018, 2019, 2020]
    do:
      # Positional arguments: image tile dir, output dir, shapefile.
      cmd: >-
        python scripts/createmasks.py
        data/processed.images.${item} data/processed.lus.${item}
        data/raw/shapefiles/forestmask/CORINE_forest.shp
        --simple
      deps:
        - data/processed.images.${item}
        # NOTE(review): only the .shp file is tracked here, while `createmasks`
        # tracks the whole shapefile directory; changes to sidecar files
        # (.dbf/.shx/.prj) would not invalidate this stage - confirm intent.
        - data/raw/shapefiles/forestmask/CORINE_forest.shp
      outs:
        - data/processed.lus.${item}
  # Per year: run scripts/createdataset.py on the image, mask and lus tiles and
  # write the result below data/dataset (sub-directory train_<year>).
  createdataset:
    foreach: [2017, 2018, 2019, 2020]
    do:
      # Positional arguments: image dir, mask dir, lus dir, dataset root.
      # NOTE(review): --stats is given as a bare file name while the tracked
      # output is data/dataset/stats_<year>.csv; presumably the script resolves
      # it relative to the dataset root - confirm against the script.
      cmd: >-
        python scripts/createdataset.py
        data/processed.images.${item}
        data/processed.masks.${item}
        data/processed.lus.${item}
        data/dataset
        --subdir train_${item}
        --source_dim ${source_dim}
        --tile_size ${createdataset.tile_size}
        --format ${file_type}
        --stats stats_${item}.csv
      deps:
        - data/processed.images.${item}
        - data/processed.masks.${item}
        - data/processed.lus.${item}
      # Parameters interpolated into the command above.
      params:
        - source_dim
        - createdataset.tile_size
        - file_type
      outs:
        - data/dataset/train_${item}
        - data/dataset/stats_${item}.csv
  # Only the 2017 and 2019 datasets are merged into the train/val/test splits;
  # 2018 and 2020 are used for testing only.
  mergedatasets:
    cmd: >-
      python scripts/mergedatasets.py
      data/dataset/train_2017 data/dataset/train_2019
    deps:
      - data/dataset/train_2017
      - data/dataset/train_2019
    outs:
      - data/dataset/train
      - data/dataset/val
      - data/dataset/test
  # Training is not part of this pipeline: do it manually.
  #
  # Inference, per year: run scripts/inference.py on the image tiles, then
  # merge the predicted tiles into one mosaic GeoTIFF with gdal_merge.py.
  inference:
    foreach: [2017, 2018, 2019, 2020]
    do:
      # The three commands are chained with `&&` rather than `;`. With `;`, a
      # failing inference.py was masked: gdal_merge.py still ran on whatever
      # tiles existed and its exit status alone decided whether the stage
      # "succeeded", so incomplete outputs could be cached.
      # The folded scalar (>-) joins all lines below into one shell command.
      cmd: >-
        mkdir -p data/predicted.${item} &&
        stdbuf -i0 -o0 -e0 python scripts/inference.py --all --nopreview
        -o data/predicted.${item} data/processed.images.${item} &&
        gdal_merge.py
        -co "TILED=YES" -co "COMPRESS=LZW" -co "PREDICTOR=2"
        -co "NUM_THREADS=ALL_CPUS"
        -o data/predicted_mosaic_${item}.tif
        data/predicted.${item}/ortho_ms_${item}_EPSG3044_*
      deps:
        - data/processed.images.${item}
        # NOTE(review): the checkpoint is not passed on the command line;
        # presumably inference.py loads this path by default - confirm.
        - checkpoints/bestmodel.ckpt
      outs:
        - data/predicted.${item}
        - data/predicted_mosaic_${item}.tif
  # Run scripts/computestats_inference.py over the predictions of all four
  # years.
  # NOTE(review): the declared output path is not passed on the command line;
  # presumably it is the script's default - confirm against the script.
  computestatsinference:
    cmd: >-
      python scripts/computestats_inference.py
      data/predicted.2017 data/predicted.2018
      data/predicted.2019 data/predicted.2020
    deps:
      - data/predicted.2017
      - data/predicted.2018
      - data/predicted.2019
      - data/predicted.2020
    outs:
      - data/predicted.stats.csv
Tip!

Press p or ← to see the previous file, or n or → to see the next file

Comments

Loading...