workers.tf 9.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256
  1. # Some instance variables
  2. locals {
  3. instance_name_worker = "${var.prefix}-alsi-worker"
  4. splunk_vpc_cidrs = toset(concat([var.vpc_cidr], local.cidr_map["vpc-private-services"]))
  5. data_sources = toset(concat(tolist(local.splunk_vpc_cidrs), local.splunk_data_sources))
  6. }
  7. resource "aws_network_interface" "worker" {
  8. count = local.alsi_workers
  9. subnet_id = var.subnets[count.index % length(var.subnets)] # evenly distributed across subnets
  10. security_groups = [data.aws_security_group.typical-host.id, aws_security_group.alsi_worker_security_group.id]
  11. description = "${local.instance_name_worker}-${count.index}"
  12. tags = merge(local.standard_tags,
  13. var.tags,
  14. {
  15. Name = "${local.instance_name_worker}-${count.index}",
  16. instance_num = count.index,
  17. instance_count = local.alsi_workers
  18. }
  19. )
  20. }
  21. resource "aws_instance" "worker" {
  22. count = local.alsi_workers
  23. #availability_zone = var.azs[count.index % 2] # automatically determined by the network interface
  24. tenancy = "default"
  25. ebs_optimized = true
  26. disable_api_termination = var.instance_termination_protection
  27. instance_initiated_shutdown_behavior = "stop"
  28. instance_type = local.instance_types["alsi-worker"]
  29. key_name = "msoc-build"
  30. monitoring = false # checkov:skip=CKV_AWS_126:Detailed monitoring not needed at this time
  31. iam_instance_profile = "msoc-default-instance-profile"
  32. metadata_options {
  33. http_endpoint = "enabled"
  34. # checkov:skip=CKV_AWS_79:see tfsec explanation
  35. # tfsec:ignore:aws-ec2-enforce-http-token-imds Saltstack doesn't use s3 sources appropriately; see https://github.com/saltstack/salt/issues/60668
  36. http_tokens = "optional"
  37. }
  38. ami = local.ami_map[local.ami_selection]
  39. # We need to ignore ebs_block_device changes, because if the AMI changes, so does the snapshot_id.
  40. # If they add a feature to block more specific changes (eg `ebs_block_devices[*].snapshot_id`), then
  41. # that could be removed.
  42. lifecycle { ignore_changes = [ami, key_name, user_data, ebs_block_device] }
  43. # These device definitions are optional, but added for clarity.
  44. root_block_device {
  45. volume_type = "gp3"
  46. #volume_size = Override via var?
  47. delete_on_termination = true
  48. encrypted = true
  49. kms_key_id = data.aws_kms_key.ebs-key.arn
  50. }
  51. network_interface {
  52. device_index = 0
  53. network_interface_id = aws_network_interface.worker[count.index].id
  54. }
  55. user_data = data.template_cloudinit_config.cloud-init-worker[count.index].rendered
  56. tags = merge(local.standard_tags,
  57. var.tags,
  58. {
  59. Name = "${local.instance_name_worker}-${count.index}",
  60. instance_num = count.index,
  61. instance_count = local.alsi_workers
  62. }
  63. )
  64. volume_tags = merge(local.standard_tags,
  65. var.tags,
  66. {
  67. Name = "${local.instance_name_worker}-${count.index}",
  68. instance_num = count.index,
  69. instance_count = local.alsi_workers
  70. }
  71. )
  72. }
  73. module "private_dns_record_worker" {
  74. count = local.alsi_workers
  75. source = "../../../submodules/dns/private_A_record"
  76. name = "${local.instance_name_worker}-${count.index}"
  77. ip_addresses = [aws_instance.worker[count.index].private_ip]
  78. dns_info = var.dns_info
  79. reverse_enabled = var.reverse_enabled
  80. providers = {
  81. aws.c2 = aws.c2
  82. }
  83. }
  84. # Render a multi-part cloud-init config making use of the part
  85. # above, and other source files
  86. data "template_cloudinit_config" "cloud-init-worker" {
  87. count = local.alsi_workers
  88. gzip = true
  89. base64_encode = true
  90. # Main cloud-config configuration file.
  91. part {
  92. filename = "init.cfg"
  93. content_type = "text/cloud-config"
  94. content = templatefile("${path.module}/cloud-init/cloud-init.tpl",
  95. {
  96. hostname = "${local.instance_name_worker}-${count.index}"
  97. fqdn = "${local.instance_name_worker}-${count.index}.${var.dns_info["private"]["zone"]}"
  98. splunk_prefix = var.prefix
  99. environment = var.environment
  100. salt_master = local.salt_master
  101. proxy = local.proxy
  102. aws_partition = var.aws_partition
  103. aws_partition_alias = var.aws_partition_alias
  104. aws_region = var.aws_region
  105. }
  106. )
  107. }
  108. }
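## ALSI Worker
#
# Summary of the rules defined in this file:
# Ingress:
# 9000      - From the elastic ALB security group (health check)
# 9200      - From the elastic ALB security group (data stream)
# 9000      - From vpc-access
# 9200      - From vpc-access
# 9997-9998 - From vpc-access
# 8088      - From vpc-access
# 9997-9998 - From data sources (only when the Splunk NLB is enabled)
# 8088      - From data sources
# (Rules for the HEC and S2S ALBs are still TODO.)
#
# Egress:
# 4200      - To master
# 8089      - To the VPC CIDR (Splunk management)
# 9997-9998 - To the VPC CIDR (Splunk)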
  122. resource "aws_security_group" "alsi_worker_security_group" {
  123. name_prefix = "${var.prefix}_alsi_worker_security_group" # name prefix and livecycle allow for smooth updates
  124. lifecycle { create_before_destroy = true } # handle updates gracefully
  125. description = "Security Group for Aggregated Log Source Ingestion"
  126. vpc_id = var.vpc_id
  127. tags = merge(local.standard_tags, var.tags)
  128. }
  129. #----------------------------------------------------------------------------
  130. # INGRESS
  131. #----------------------------------------------------------------------------
  132. resource "aws_security_group_rule" "alsi_worker_alb_elastic1" {
  133. description = "Health Check"
  134. type = "ingress"
  135. from_port = 9000
  136. to_port = 9000
  137. protocol = "tcp"
  138. source_security_group_id = aws_security_group.alsi-alb-elastic-sg.id
  139. security_group_id = aws_security_group.alsi_worker_security_group.id
  140. }
  141. resource "aws_security_group_rule" "alsi_worker_alb_elastic2" {
  142. description = "Data Stream"
  143. type = "ingress"
  144. from_port = 9200
  145. to_port = 9200
  146. protocol = "tcp"
  147. source_security_group_id = aws_security_group.alsi-alb-elastic-sg.id
  148. security_group_id = aws_security_group.alsi_worker_security_group.id
  149. }
  150. # TODO: Repeat top 2 for HEC and S2S forwarders
  151. resource "aws_security_group_rule" "alsi_worker_vpn_in1" {
  152. description = "Web access from VPN"
  153. type = "ingress"
  154. from_port = 9000
  155. to_port = 9000
  156. protocol = "tcp"
  157. cidr_blocks = local.cidr_map["vpc-access"]
  158. security_group_id = aws_security_group.alsi_worker_security_group.id
  159. }
  160. resource "aws_security_group_rule" "alsi_worker_vpn_in2" {
  161. description = "Web access from VPN"
  162. type = "ingress"
  163. from_port = 9200
  164. to_port = 9200
  165. protocol = "tcp"
  166. cidr_blocks = local.cidr_map["vpc-access"]
  167. security_group_id = aws_security_group.alsi_worker_security_group.id
  168. }
  169. resource "aws_security_group_rule" "alsi_worker_vpn_in3" {
  170. description = "Splunk access from VPN"
  171. type = "ingress"
  172. from_port = 9997
  173. to_port = 9998
  174. protocol = "tcp"
  175. cidr_blocks = local.cidr_map["vpc-access"]
  176. security_group_id = aws_security_group.alsi_worker_security_group.id
  177. }
  178. resource "aws_security_group_rule" "alsi_worker_vpn_in4" {
  179. description = "HEC access from VPN"
  180. type = "ingress"
  181. from_port = 8088
  182. to_port = 8088
  183. protocol = "tcp"
  184. cidr_blocks = local.cidr_map["vpc-access"]
  185. security_group_id = aws_security_group.alsi_worker_security_group.id
  186. }
  187. resource "aws_security_group_rule" "alsi_worker_external_in" {
  188. # NLB requires the security group to allow access
  189. description = "Splunk access via NLB"
  190. count = local.alsi_splunk_nlb ? 1 : 0
  191. type = "ingress"
  192. from_port = 9997
  193. to_port = 9998
  194. protocol = "tcp"
  195. cidr_blocks = local.data_sources
  196. security_group_id = aws_security_group.alsi_worker_security_group.id
  197. }
  198. resource "aws_security_group_rule" "alsi_worker_hec_in" {
  199. description = "HEC access from Customer"
  200. type = "ingress"
  201. from_port = 8088
  202. to_port = 8088
  203. protocol = "tcp"
  204. cidr_blocks = local.data_sources
  205. security_group_id = aws_security_group.alsi_worker_security_group.id
  206. }
  207. #----------------------------------------------------------------------------
  208. # EGRESS
  209. #----------------------------------------------------------------------------
  210. resource "aws_security_group_rule" "alsi-interconnections" {
  211. description = "Cribl Replication"
  212. type = "egress"
  213. from_port = 4200
  214. to_port = 4200
  215. protocol = "tcp"
  216. source_security_group_id = aws_security_group.alsi_master_security_group.id
  217. security_group_id = aws_security_group.alsi_worker_security_group.id
  218. }
  219. resource "aws_security_group_rule" "alsi-worker-splunk-mgmt" {
  220. description = "Management Access"
  221. type = "egress"
  222. from_port = 8089
  223. to_port = 8089
  224. protocol = "tcp"
  225. cidr_blocks = [var.vpc_cidr]
  226. security_group_id = aws_security_group.alsi_worker_security_group.id
  227. }
  228. resource "aws_security_group_rule" "alsi-worker-splunk-data" {
  229. description = "Management Access"
  230. type = "egress"
  231. from_port = 9997
  232. to_port = 9998
  233. protocol = "tcp"
  234. cidr_blocks = [var.vpc_cidr]
  235. security_group_id = aws_security_group.alsi_worker_security_group.id
  236. }