I have a similar problem, but my “failure_trigger_sample_size” is set to 2.
I’m load balancing between three nodes, wiwnd331-333.
If I shut down one of the nodes (333), this is the gateway log:
[HOST CHECKER MANAGER] Host is DOWN: http://wiwnd333.net:19081/HealthCheckEndpoint.Application/HealthCheckEndpoint/Health
http: proxy error: read tcp connection reset by peer" server_name=“wiwnd333.net:19081”
I have a separate API definition that performs the health checks for all my other APIs, which also connect to those three nodes:
{
"id": "xx",
"name": "Health Check",
"slug": "health-check",
"api_id": "xx",
"org_id": "xx",
"use_keyless": true,
"use_oauth2": false,
"use_openid": false,
"openid_options": {
"providers": [],
"segregate_by_client": false
},
"oauth_meta": {
"allowed_access_types": [],
"allowed_authorize_types": [],
"auth_login_redirect": ""
},
"auth": {
"use_param": false,
"param_name": "",
"use_cookie": false,
"cookie_name": "",
"auth_header_name": ""
},
"use_basic_auth": false,
"enable_jwt": false,
"use_standard_auth": false,
"enable_coprocess_auth": false,
"jwt_signing_method": "",
"jwt_source": "",
"jwt_identity_base_field": "",
"jwt_client_base_field": "",
"jwt_policy_field_name": "",
"notifications": {
"shared_secret": "",
"oauth_on_keychange_url": ""
},
"enable_signature_checking": false,
"hmac_allowed_clock_skew": -1,
"base_identity_provided_by": "",
"definition": {
"location": "header",
"key": "x-api-version"
},
"version_data": {
"not_versioned": true,
"versions": {
"Default": {
"name": "Default",
"expires": "",
"paths": {
"ignored": [],
"white_list": [],
"black_list": []
},
"use_extended_paths": true,
"extended_paths": {},
"global_headers": {},
"global_headers_remove": [],
"global_size_limit": 0,
"override_target": ""
}
}
},
"uptime_tests": {
"check_list": [
{
"url": "http://wiwnd331.net:19081/HealthCheckEndpoint.Application/HealthCheckEndpoint/Health",
"method": "GET",
"headers": {},
"body": ""
},
{
"url": "http://wiwnd332.net:19081/HealthCheckEndpoint.Application/HealthCheckEndpoint/Health",
"method": "GET",
"headers": {},
"body": ""
},
{
"url": "http://wiwnd333.net:19081/HealthCheckEndpoint.Application/HealthCheckEndpoint/Health",
"method": "GET",
"headers": {},
"body": ""
}
],
"config": {
"expire_utime_after": 0,
"service_discovery": {
"use_discovery_service": false,
"query_endpoint": "",
"use_nested_query": false,
"parent_data_path": "",
"data_path": "",
"port_data_path": "",
"target_path": "",
"use_target_list": false,
"cache_timeout": 60,
"endpoint_returns_list": false
},
"recheck_wait": 0
}
},
"proxy": {
"preserve_host_header": false,
"listen_path": "/health-check/",
"target_url": "/",
"strip_listen_path": true,
"enable_load_balancing": false,
"target_list": [],
"check_host_against_uptime_tests": true,
"service_discovery": {
"use_discovery_service": false,
"query_endpoint": "",
"use_nested_query": false,
"parent_data_path": "",
"data_path": "hostname",
"port_data_path": "port",
"target_path": "/api-slug",
"use_target_list": false,
"cache_timeout": 60,
"endpoint_returns_list": false
}
},
"disable_rate_limit": false,
"disable_quota": false,
"custom_middleware": {
"pre": [],
"post": [],
"post_key_auth": [],
"auth_check": {
"name": "",
"path": "",
"require_session": false
},
"response": [],
"driver": "",
"id_extractor": {
"extract_from": "",
"extract_with": "",
"extractor_config": {}
}
},
"custom_middleware_bundle": "",
"cache_options": {
"cache_timeout": 60,
"enable_cache": true,
"cache_all_safe_requests": false,
"cache_response_codes": [],
"enable_upstream_cache_control": false
},
"session_lifetime": 0,
"active": true,
"auth_provider": {
"name": "",
"storage_engine": "",
"meta": {}
},
"session_provider": {
"name": "",
"storage_engine": "",
"meta": null
},
"event_handlers": {
"events": {}
},
"enable_batch_request_support": false,
"enable_ip_whitelisting": false,
"allowed_ips": [],
"dont_set_quota_on_create": false,
"expire_analytics_after": 0,
"response_processors": [],
"CORS": {
"enable": false,
"allowed_origins": [],
"allowed_methods": [],
"allowed_headers": [],
"exposed_headers": [],
"allow_credentials": false,
"max_age": 24,
"options_passthrough": false,
"debug": false
},
"domain": "xx",
"do_not_track": false,
"tags": [],
"enable_context_vars": false
}
The problem: while the node is down, every third request still fails with “There was a problem proxying the request”.
After the machine comes up again, the gateway notices it:
[HOST CHECKER MANAGER] Host is UP: http://wiwnd333.net:19081/HealthCheckEndpoint.Application/HealthCheckEndpoint/Health
And this is the API I am trying to call:
{
"id": "xx",
"name": "DealerSearch",
"slug": "dealersearch",
"api_id": "xx",
"org_id": "xx",
"use_keyless": false,
"use_oauth2": false,
"use_openid": false,
"openid_options": {
"providers": [],
"segregate_by_client": false
},
"oauth_meta": {
"allowed_access_types": [],
"allowed_authorize_types": [],
"auth_login_redirect": ""
},
"auth": {
"use_param": false,
"param_name": "",
"use_cookie": false,
"cookie_name": "",
"auth_header_name": "X-ApiKey"
},
"use_basic_auth": false,
"enable_jwt": false,
"use_standard_auth": true,
"enable_coprocess_auth": false,
"jwt_signing_method": "",
"jwt_source": "",
"jwt_identity_base_field": "",
"jwt_client_base_field": "",
"jwt_policy_field_name": "",
"notifications": {
"shared_secret": "",
"oauth_on_keychange_url": ""
},
"enable_signature_checking": false,
"hmac_allowed_clock_skew": -1,
"base_identity_provided_by": "",
"definition": {
"location": "header",
"key": "Accept"
},
"version_data": {
"not_versioned": true,
"versions": {
"application/vnd.x.v1+json": {
"name": "application/vnd.x.v1+json",
"expires": "",
"paths": {
"ignored": [],
"white_list": [],
"black_list": []
},
"use_extended_paths": true,
"extended_paths": {},
"global_headers": {},
"global_headers_remove": [],
"global_size_limit": 0,
"override_target": ""
}
}
},
"uptime_tests": {
"check_list": [],
"config": {
"expire_utime_after": 0,
"service_discovery": {
"use_discovery_service": false,
"query_endpoint": "xxx",
"use_nested_query": false,
"parent_data_path": "",
"data_path": "tests",
"port_data_path": "",
"target_path": "",
"use_target_list": false,
"cache_timeout": 60,
"endpoint_returns_list": false
},
"recheck_wait": 0
}
},
"proxy": {
"preserve_host_header": false,
"listen_path": "/dealersearch/",
"target_url": "",
"strip_listen_path": true,
"enable_load_balancing": true,
"target_list": [
"http://wiwnd331.net:19081/DealerApplication/DealerService/",
"http://wiwnd332.net:19081/DealerApplication/DealerService/",
"http://wiwnd333.net:19081/DealerApplication/DealerService/"
],
"check_host_against_uptime_tests": true,
"service_discovery": {
"use_discovery_service": false,
"query_endpoint": "xxx",
"use_nested_query": false,
"parent_data_path": "",
"data_path": "Host",
"port_data_path": "Port",
"target_path": "",
"use_target_list": false,
"cache_timeout": 60,
"endpoint_returns_list": false
}
},
"disable_rate_limit": false,
"disable_quota": false,
"custom_middleware": {
"pre": [],
"post": [],
"post_key_auth": [],
"auth_check": {
"name": "",
"path": "",
"require_session": false
},
"response": [],
"driver": "",
"id_extractor": {
"extract_from": "",
"extract_with": "",
"extractor_config": {}
}
},
"custom_middleware_bundle": "",
"cache_options": {
"cache_timeout": 60,
"enable_cache": true,
"cache_all_safe_requests": false,
"cache_response_codes": [
200
],
"enable_upstream_cache_control": false
},
"session_lifetime": 0,
"active": true,
"auth_provider": {
"name": "",
"storage_engine": "",
"meta": {}
},
"session_provider": {
"name": "",
"storage_engine": "",
"meta": null
},
"event_handlers": {
"events": {}
},
"enable_batch_request_support": false,
"enable_ip_whitelisting": false,
"allowed_ips": [],
"dont_set_quota_on_create": false,
"expire_analytics_after": 0,
"response_processors": [],
"CORS": {
"enable": true,
"allowed_origins": [
"xxx"
],
"allowed_methods": [],
"allowed_headers": [
"xxx"
],
"exposed_headers": [],
"allow_credentials": false,
"max_age": 24,
"options_passthrough": false,
"debug": false
},
"domain": "xxx",
"do_not_track": false,
"tags": [],
"enable_context_vars": false
}
Sorry for the wall of text, but I have been trying to solve this for months and haven’t been able to get it to work.
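This is part of my tyk.conf. The health check timeout (“health_check_value_timeouts”) is 60 seconds, and 2 samples (“failure_trigger_sample_size”) at a 30-second interval (“time_wait”) also add up to 60 seconds. Could this be the problem?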
"health_checks": {
"enable_health_checks": true,
"health_check_value_timeouts": 60
},
"uptime_tests": {
"disable": false,
"config": {
"enable_uptime_analytics": true,
"failure_trigger_sample_size": 2,
"time_wait": 30,
"checker_pool_size": 20
}
},