This repository has been archived by the owner on Jun 1, 2023. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 13
/
Snakefile
110 lines (95 loc) · 3.49 KB
/
Snakefile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
# import global scripts
import sys
import os
# add all the src directories to the path so that we have access to the scripts
def add_all_src_dir():
for contents in os.walk('.'):
directory = contents[0]
if directory.endswith('src'):
sys.path.insert(0, directory)
# import local scripts
add_all_src_dir()
import catch_attr
import aggregate_upstream
configfile: 'catchment_attr_links.yaml'
regions = ['02']
cat_att_dir = '20_catchment_attributes/out'
rule all:
input:
metadata = f"{cat_att_dir}/combined_metadata.csv",
seg_attr = expand("{fldr}/combined_seg_attr_{region}.feather", fldr=cat_att_dir, region=regions),
drb_attr = f"{cat_att_dir}/seg_attr_drb.feather",
subset_drb_attr = f"{cat_att_dir}/seg_attr_drb_subset.feather"
params_out_fmt = "{fldr}/GeospatialFabricAttributes-PRMS_{category}_{region}.gdb"
rule get_all_catchment_params:
output:
directory(params_out_fmt)
run:
catch_attr.download_unzip_cat_attr_data(wildcards.fldr,
wildcards.category,
wildcards.region)
rule combine_categories:
input:
'catchment_attr_links.yaml',
expand(params_out_fmt, fldr=cat_att_dir, category=config['categories'],
region=regions)
output:
"{fldr}/combined_categories_{region}.feather"
run:
catch_attr.combine_categories(input[1:], output[0])
rule add_ids_and_seg_attributes:
input:
'10_spatial_data/out/nsegmentNationalIdentifier.csv',
'10_spatial_data/out/nhruNationalIdentifier.csv',
rules.combine_categories.output
output:
"{fldr}/combined_cats_w_ids_{region}.feather"
run:
catch_attr.add_ids_and_seg_attr(input[0], input[1], input[2], wildcards.region, output[0])
rule relate_to_segments:
input:
rules.add_ids_and_seg_attributes.output
output:
"{fldr}/combined_seg_attr_{region}.feather"
run:
catch_attr.relate_attr_to_segments(input[0], output[0], True)
rule subset_attr_to_drb:
input:
# this is a shapefile of the entire DRB cutout
"10_spatial_data/out/Segments_subset.shp",
f"{cat_att_dir}/combined_seg_attr_02.feather"
output:
rules.all.input.drb_attr
run:
catch_attr.subset_for_drb(input[0], input[1], output[0])
rule subset_attr_drb_subset:
input:
# this is a list of link ids that are in the subset of the DRB (the small subset Xiaowei started with)
"10_spatial_data/out/sntemp_subset_ids.csv",
f"{cat_att_dir}/combined_seg_attr_02.feather"
output:
rules.all.input.subset_drb_attr
run:
catch_attr.subset_for_drb_subset(input[0], input[1], output[0])
rule aggregate_upstream:
input:
f"{cat_att_dir}/combined_seg_attr_02.feather",
"10_spatial_data/out/high_obs_upstream_sites.csv"
output:
f"{cat_att_dir}/aggregated_upstream.feather"
run:
aggregate_upstream.aggregate_upstream_attr(input[0], input[1], output[0])
metadata_file_fmt = "{fldr}/{category}_metadata.xml"
rule get_metadata_xml_files:
output:
metadata_file_fmt
run:
catch_attr.get_metadata_file(wildcards.category, output[0])
rule combine_metadata_files:
input:
metadata_files = expand(metadata_file_fmt, fldr=cat_att_dir,
category=config['categories'])
output:
rules.all.input.metadata
run:
catch_attr.consolidate_metdata(input, output[0])