# populationsim_settings.yaml
####################################################################
# PopulationSim Properties
####################################################################
# Algorithm/Software Configuration
# ------------------------------------------------------------------
# Switches for the balancing / integerizing algorithms. The exact effect of
# each flag is defined by PopulationSim, not by this file; see its
# configuration documentation before changing any of them.
INTEGERIZE_WITH_BACKSTOPPED_CONTROLS: true
SUB_BALANCE_WITH_FLOAT_SEED_WEIGHTS: false
GROUP_BY_INCIDENCE_SIGNATURE: true
USE_SIMUL_INTEGERIZER: true
USE_CVXPY: false
# NOTE(review): presumably caps how far a seed household weight may be
# expanded relative to its initial weight - confirm against the docs.
max_expansion_factor: 30
# Geographic Settings
# ------------------------------------------------------------------
# Geography levels, in the same order as before (list order is preserved).
# NOTE(review): presumably ordered from largest to smallest - confirm.
geographies:
  - region
  - PUMA
  - taz_id
# The seed geography is the second entry of `geographies`.
seed_geography: PUMA
# Tracing
# ------------------------------------------------------------------
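# NOTE: this disabled example uses TAZ / TRACT, which are not among the
# geographies configured in this file (region, PUMA, taz_id); rename the
# keys before enabling it.
# trace_geography:
#   TAZ: 100
#   TRACT: 10200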
# Data Directory
# ------------------------------------------------------------------
# Name of the directory holding the input data.
# NOTE(review): the CSV filenames under input_table_list are presumably
# resolved relative to this directory - confirm.
data_dir: data
# Input Data Tables
# ------------------------------------------------------------------
# input_pre_processor input_table_list
# One list entry per input table: `tablename` is the name the table is
# registered under and `filename` is the CSV it is read from.
# `column_map` renames columns on load (source name: new name, per the
# PopulationSim docs); hhnum becomes hh_id, the column that index_col and
# household_id_col refer to.
input_table_list:
  - tablename: households
    filename: seed_households.csv
    index_col: hh_id
    column_map:
      hhnum: hh_id
  - tablename: persons
    filename: seed_persons.csv
    column_map:
      hhnum: hh_id
      SPORDER: per_num
  - tablename: geo_cross_walk
    filename: geo_cross_walk.csv
  - tablename: taz_id_control_data
    filename: future_controls.csv
# Reserved Column Names
# ------------------------------------------------------------------
# hh_id is the renamed household id column (see column_map / index_col under
# input_table_list); WGTP also appears in the household output columns.
# NOTE(review): num_hh is presumably a control defined in controls.csv -
# confirm it exists there.
household_weight_col: WGTP
household_id_col: hh_id
total_hh_control: num_hh
# Control Specification File Name
# ------------------------------------------------------------------
# File name of the control specification.
# NOTE(review): the directory it is looked up in is not stated in this
# file - confirm.
control_file_name: controls.csv
# Output Tables
# ------------------------------------------------------------------
# output_tables can specify either a list of output tables to include or to skip
# if neither is specified, then no tables will be written
# `action` and `tables` must be nested under output_tables; here only the
# two listed tables are included.
output_tables:
  action: include
  tables:
    - summary_taz_id
    - expanded_household_ids
# Synthetic Population Output Specification
# ------------------------------------------------------------------
#
# `households` and `persons` each name an output CSV and the columns to
# write to it; both sections are nested under output_synthetic_population.
# NOTE(review): `household_id` presumably names the id column generated for
# the synthetic households - confirm against the PopulationSim docs.
output_synthetic_population:
  household_id: household_id
  households:
    filename: synthetic_households.csv
    columns:
      - NP
      - VEH
      - worker_count
      - HHT
      - HINCP
      - WGTP
      - hh_id
      - TEN
  persons:
    filename: synthetic_persons.csv
    columns:
      - white_hispanic
      - non_white_hispanic
      - white_non_hispanic
      - black_non_hispanic
      - other_non_hispanic
      - asian_non_hispanic
      - two_or_more_races_non_hispanic
      - AGEP
      - SEX
      - SCH
      - is_worker
      - hh_id
      - per_num
      - RAC1P
      - HISP
      - WKHP
      - SCHG
# Steps for base mode
# ------------------------------------------------------------------
# Pipeline steps, in the order listed. `steps` must be nested under run_list.
# sub_balancing is parameterised with taz_id, the last entry of
# `geographies`.
run_list:
  steps:
    - input_pre_processor
    - setup_data_structures
    - initial_seed_balancing
    - meta_control_factoring
    - final_seed_balancing
    - integerize_final_seed_weights
    - sub_balancing.geography=taz_id
    - expand_households
    - summarize
    - write_tables
    - write_synthetic_population
  # Disabled; uncomment to restart the run after the named step.
  # resume_after: expand_households