-
Notifications
You must be signed in to change notification settings - Fork 3
/
variables.tf
161 lines (132 loc) · 4.44 KB
/
variables.tf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
# This file declares the Terraform variables that are used in the main file.
# Values are assigned in the terraform.tfvars file.
# Name of the Lambda function that collects CDX records from the
# Internet Archive. String; falls back to "my_lambda" when not set.
variable "lambda_name" {
  type        = string
  default     = "my_lambda"
  description = "name of the lambda function that collects CDX records from the Internet Archive"
}
# Name of the S3 bucket that receives the scraping results.
# String; falls back to "my_result_bucket" when not set.
variable "result_bucket" {
  type        = string
  default     = "my_result_bucket"
  description = "name of the s3 bucket where scraping results stored"
}
# Folder for the scraping results; per its description it is used together
# with result_bucket. String; the default is the empty string.
variable "result_bucket_folder" {
  type        = string
  default     = ""
  description = "name of the folder in which scraping results will be stored, this works with the result_bucket variable"
}
# Name of the S3 bucket holding the Lambda zip and the tfstate.
# String; falls back to "my_code_bucket" when not set.
variable "code_bucket" {
  type        = string
  default     = "my_code_bucket"
  description = "name of the s3 bucket where lambda zip and tfstate are stored"
}
# Log level for the CDX side. String; defaults to "info".
# The validation rule accepts exactly two values: "info" and "error".
variable "cdx_logging_level" {
  type        = string
  default     = "info"
  description = "set the log level, log messages which are less severe than level will be ignored"

  validation {
    error_message = "Allowed values are: 'info' or 'error'."
    # Same two-way comparison as before, wrapped in parentheses so each
    # permitted value sits on its own line.
    condition = (
      var.cdx_logging_level == "info" ||
      var.cdx_logging_level == "error"
    )
  }
}
# Log level for the scraper side. String; defaults to "info".
# The validation rule accepts exactly two values: "info" and "error".
variable "scraper_logging_level" {
  type        = string
  default     = "info"
  description = "set the log level, log messages which are less severe than level will be ignored"

  validation {
    error_message = "Allowed values are: 'info' or 'error'."
    # Same two-way comparison as before, wrapped in parentheses so each
    # permitted value sits on its own line.
    condition = (
      var.scraper_logging_level == "info" ||
      var.scraper_logging_level == "error"
    )
  }
}
# AWS log group used for metrics.
# String; falls back to "my_log_group" when not set.
variable "custom_log_group" {
  type        = string
  default     = "my_log_group"
  description = "AWS log group for metrics"
}
# Log stream that carries the CDX metrics.
# String; falls back to "my_cdx_log_stream" when not set.
variable "custom_log_stream_cdx" {
  type        = string
  default     = "my_cdx_log_stream"
  description = "custom log stream for CDX metrics"
}
# Log stream that carries the scrape metrics.
# String; falls back to "my_scrape_log_stream" when not set.
variable "custom_log_stream_scrape" {
  type        = string
  default     = "my_scrape_log_stream"
  description = "custom log stream for scrape metrics"
}
# Upper bound on messages in the Fetch SQS queue; per the description, no
# new messages are added once the bound is reached.
# Declared as a string even though the default ("100000") is numeric text.
variable "sqs_fetch_limit" {
  type        = string
  default     = "100000"
  description = "max number of allowed messages in Fetch SQS queue. When this limit is reached, no new messages are added"
}
# Maximum number of messages received from the CDX SQS queue per iteration.
# Declared as a string even though the default ("10") is numeric text.
variable "sqs_cdx_max_messages" {
  type        = string
  default     = "10"
  description = "the max number of messages received from the CDX SQS queue in 1 iteration"
}
# Number of iterations the CDX function runs; per the description each
# iteration handles at most sqs_cdx_max_messages messages.
# Declared as a string even though the default ("20") is numeric text.
variable "cdx_lambda_n_iterations" {
  type        = string
  default     = "20"
  description = "the number of iterations the CDX function runs. Every iteration the cdx function processes max N='sqs_cdx_max_messages' messages"
}
# Identifier of the scrape run; per the description it is attached to the
# CDX metrics logged in CloudWatch. String; defaults to "1".
variable "cdx_run_id" {
  type        = string
  default     = "1"
  description = "the ID of the crunchbase scrape run; this will be added as identifier to the cdx metrics logged in cloudwatch"
}
# Starting year for the Internet Archive request payload.
# Declared as a string; defaults to "2018".
variable "ia_payload_year_from" {
  type        = string
  default     = "2018"
  description = "starting year parameter form Internet Archive request payload"
}
# End year for the Internet Archive request payload.
# Declared as a string; defaults to "2022".
variable "ia_payload_year_to" {
  type        = string
  default     = "2022"
  description = "end year parameter form Internet Archive request payload"
}
# Switch for matching only the exact URL provided. String; defaults to "0".
# NOTE(review): presumably "0"/"1" mean off/on - confirm against the consumer.
variable "match_exact_url" {
  type        = string
  default     = "0"
  description = "match only the exact URL provided (ignores presence or absence of 'www.')"
}
# File formats to export, given as one comma-separated string.
# The description lists txt, links and html; the default is "txt,links".
variable "formats_to_save" {
  type        = string
  default     = "txt,links"
  description = "file formats to export (possible values: txt,links,html)"
}
# Maximum number of URLs to fetch from a single domain.
# Typed as a number, with a default of 1000.
variable "url_limit_per_domain" {
  type        = number
  default     = 1000
  description = "max. number of URLs to fetch from a single domain"
}
# Author recorded for messages in the SQS queue.
# String; falls back to "author" when not set.
variable "sqs_message_author" {
  type        = string
  default     = "author"
  description = "author of messages in SQS queue"
}
# Name of the Terraform deployment; per the description it is used for all
# resources. An explicit string type is declared here so the value is
# constrained to match its string default.
# NOTE(review): the default "author" looks like a placeholder - confirm it is
# overridden in terraform.tfvars.
variable "deployment_name" {
  description = "The name of the terraform deployment. This name is used for all resources."
  type        = string
  default     = "author"
}
# S3 destination bucket, identified by ARN according to the variable name.
# An explicit string type is declared here so the value is constrained to
# match its string default.
# NOTE(review): the default "author" is not ARN-shaped and looks like a
# placeholder - confirm a real value is supplied in terraform.tfvars.
variable "s3_destination_bucket_arn" {
  description = "The S3 destination bucket."
  type        = string
  default     = "author"
}
# S3 destination bucket. An explicit string type is declared here so the
# value is constrained to match its string default.
# NOTE(review): the description is identical to that of
# s3_destination_bucket_arn; presumably this one holds the bucket name rather
# than the ARN - confirm against the consumer. The default "author" looks
# like a placeholder.
variable "s3_destination_bucket" {
  description = "The S3 destination bucket."
  type        = string
  default     = "author"
}
# Name of the Glue catalog database.
# String; falls back to "author" when not set.
variable "glue_catalog_database_name" {
  type        = string
  default     = "author"
  description = "The Glue catalog database name"
}
# Name of the table inside the Glue catalog database.
# String; falls back to "author" when not set.
variable "glue_catalog_table_name" {
  type        = string
  default     = "author"
  description = "The Glue catalog database table name"
}
# Name of the IAM role for the Lambda Scrape function; per the description
# that function sends data to Kinesis Firehose.
# String; falls back to "author" when not set.
variable "iam_role_lambda_scrape_name" {
  type        = string
  default     = "author"
  description = "The IAM Role name of the Lambda Scrape function that sends data to Kinesis Firehose."
}