The datasource has 37 dimensions and 45 metrics. The spec file:
{
"type": "kafka",
"dataSchema": {
"dataSource": "MY_DATASOURCE_DAY",
"parser": {
"type": "string",
"parseSpec": {
"format": "json",
"timestampSpec": {
"column": "timestamp",
"format": "millis"
},
"dimensionsSpec": {
"dimensions": [
"mp_id",
"application_id",
"instance_id",
"action_name",
"message_type",
"from_path",
"path",
"open_path",
"close_path",
"scene",
"country_id",
"region_id",
"city_id",
"carrier_id",
"error_message",
"error_filename",
"request_method",
"host",
"uri",
"network_type",
"wechat_version",
"route_chain",
"uid",
"http_code",
"system",
"ip",
"device_type",
"agreement_id",
"protocol",
"error_type",
"error_detail",
"custom_code",
"api_name",
"opera_name",
"offset_left",
"offset_top",
"agent_version"
]
}
}
},
"metricsSpec": [
{
"name": "server_count",
"fieldName": "server_count",
"type": "longSum"
},
{
"name": "quit_count",
"fieldName": "quit_count",
"type": "longSum"
},
{
"name": "on_ready",
"fieldName": "on_ready",
"type": "doubleSum"
},
{
"name": "custom_time",
"fieldName": "custom_time",
"type": "longSum"
},
{
"name": "first_response_time",
"fieldName": "first_response_time",
"type": "doubleSum"
},
{
"name": "response_time",
"fieldName": "response_time",
"type": "doubleSum"
},
{
"name": "application_server_time",
"fieldName": "application_server_time",
"type": "doubleSum"
},
{
"name": "network_time",
"fieldName": "network_time",
"type": "doubleSum"
},
{
"name": "callback_time",
"fieldName": "callback_time",
"type": "longSum"
},
{
"name": "bytes_sent",
"fieldName": "bytes_sent",
"type": "longSum"
},
{
"name": "bytes_received",
"fieldName": "bytes_received",
"type": "longSum"
},
{
"name": "msg_error_pv",
"fieldName": "msg_error_pv",
"type": "longSum"
},
{
"name": "file_error_pv",
"fieldName": "file_error_pv",
"type": "longSum"
},
{
"name": "count",
"fieldName": "count",
"type": "longSum"
},
{
"name": "on_ready_count",
"fieldName": "on_ready_count",
"type": "longSum"
},
{
"name": "open_count",
"fieldName": "open_count",
"type": "longSum"
},
{
"name": "net_count",
"fieldName": "net_count",
"type": "longSum"
},
{
"name": "net_error_count",
"fieldName": "net_error_count",
"type": "longSum"
},
{
"name": "js_error_count",
"fieldName": "js_error_count",
"type": "longSum"
},
{
"name": "slow_count",
"fieldName": "slow_count",
"type": "longSum"
},
{
"name": "net_slow_count",
"fieldName": "net_slow_count",
"type": "longSum"
},
{
"name": "custom_success_count",
"fieldName": "custom_success_count",
"type": "longSum"
},
{
"name": "uv",
"fieldName": "uid",
"type": "thetaSketch"
},
{
"name": "api_success_count",
"fieldName": "api_success_count",
"type": "longSum"
},
{
"name": "api_fail_count",
"fieldName": "api_fail_count",
"type": "longSum"
},
{
"name": "api_count",
"fieldName": "api_count",
"type": "longSum"
},
{
"name": "api_cancel_count",
"fieldName": "api_cancel_count",
"type": "longSum"
},
{
"type": "longSum",
"name": "opera_time",
"fieldName": "opera_time",
"expression": null
},
{
"type": "longSum",
"name": "opera_request_time",
"fieldName": "opera_request_time",
"expression": null
},
{
"type": "longSum",
"name": "opera_server_time",
"fieldName": "opera_server_time",
"expression": null
},
{
"type": "longSum",
"name": "opera_count",
"fieldName": "opera_count",
"expression": null
},
{
"type": "longSum",
"name": "opera_request_count",
"fieldName": "opera_request_count",
"expression": null
},
{
"type": "longSum",
"name": "opera_success_count",
"fieldName": "opera_success_count",
"expression": null
},
{
"type": "longSum",
"name": "opera_fail_count",
"fieldName": "opera_fail_count",
"expression": null
},
{
"type": "longSum",
"name": "opera_slow_count",
"fieldName": "opera_slow_count",
"expression": null
},
{
"type": "longSum",
"name": "opera_server_count",
"fieldName": "opera_server_count",
"expression": null
},
{
"type": "longSum",
"name": "page_net_error_count",
"fieldName": "page_net_error_count",
"expression": null
},
{
"type" : "quantilesDoublesSketch",
"name" : "on_ready_sketch",
"fieldName" : "on_ready",
"k": 256
},
{
"type" : "quantilesDoublesSketch",
"name" : "first_response_time_sketch",
"fieldName" : "first_response_time",
"k": 256
},
{
"type" : "quantilesDoublesSketch",
"name" : "response_time_sketch",
"fieldName" : "response_time",
"k": 256
},
{
"type" : "quantilesDoublesSketch",
"name" : "network_time_sketch",
"fieldName" : "network_time",
"k": 256
},
{
"type" : "quantilesDoublesSketch",
"name" : "application_server_time_sketch",
"fieldName" : "application_server_time",
"k": 256
},
{
"type": "quantilesDoublesSketch",
"name": "opera_time_sketch",
"fieldName": "opera_time",
"k": 256
},
{
"type": "quantilesDoublesSketch",
"name": "opera_request_time_sketch",
"fieldName": "opera_request_time",
"k": 256
},
{
"type": "quantilesDoublesSketch",
"name": "opera_server_time_sketch",
"fieldName": "opera_server_time",
"k": 256
}
],
"granularitySpec": {
"type": "uniform",
"segmentGranularity": "DAY",
"queryGranularity": "DAY"
}
},
"tuningConfig": {
"type": "kafka",
"maxRowsPerSegment": 2500000,
"resetOffsetAutomatically": true,
"targetPartitionSize": 2500000
},
"ioConfig": {
"topic": "drd-mp-webchat-applet",
"consumerProperties": {
"bootstrap.servers": "kafka-server:9092"
},
"taskCount": 1,
"taskDuration": "PT1H",
"replicas": 1,
"useEarliestOffset": true
}
}
Hi all,
I found a problem when using the Kafka indexing service. The task process uses a lot of direct memory when publishing segments, almost 6x more than during the data-ingestion stage.
I'm using druid-0.13.0.
At ingestion time, the RES of the task is 1.647g, and the heap, non-heap, and direct memory are 221M, 120M, and 864M respectively.
But at publishing time, the RES of the task is 6.046g, and the heap, non-heap, and direct memory are 266M, 124M, and 5204M respectively.
The direct memory increases from 864M to 5204M when publishing begins. How can I control the usage of direct memory?
Any suggestions? Thanks!
middleManager runtime.properties
The datasource has 37 dimensions and 45 metrics. The spec file: