We just set up OpenTSDB on top of an AWS EMR HBase cluster, with Grafana querying it.
We are noticing that the dashboard queries are taking minutes to load.
We are looking for general guidance on which OpenTSDB or HBase metrics to examine in order to troubleshoot the issue.
* We see a high cache eviction rate -- we are wondering whether this indicates that the cache is too small, or whether it could simply be data expiring due to its TTL.
* We see that tsd.hbase.latency for scans, from the 50th through the 95th percentile, is extremely high at 2147483647 ms.
"tsd.core.auto_create_metrics":"true",
"tsd.core.auto_create_tagks":"true",
"tsd.core.auto_create_tagvs":"true",
"tsd.core.connections.limit":"0",
"tsd.core.enable_api":"true",
"tsd.core.enable_ui":"true",
"tsd.core.meta.cache.enable":"false",
"tsd.core.meta.enable_realtime_ts":"false",
"tsd.core.meta.enable_realtime_uid":"false",
"tsd.core.meta.enable_tsuid_incrementing":"false",
"tsd.core.meta.enable_tsuid_tracking":"false",
"tsd.core.plugin_path":"/usr/share/opentsdb/plugins",
"tsd.core.preload_uid_cache":"false",
"tsd.core.preload_uid_cache.max_entries":"300000",
"tsd.core.socket.timeout":"0",
"tsd.core.stats_with_port":"false",
"tsd.core.storage_exception_handler.enable":"false",
"tsd.core.tree.enable_processing":"false",
"tsd.core.uid.random_metrics":"false",
"tsd.http.cachedir":"/tmp/opentsdb",
"tsd.http.query.allow_delete":"false",
"tsd.http.request.cors_domains":"",
"tsd.http.request.cors_headers":"Authorization, Content-Type, Accept, Origin, User-Agent, DNT, Cache-Control, X-Mx-ReqToken, Keep-Alive, X-Requested-With, If-Modified-Since",
"tsd.http.request.enable_chunked":"false",
"tsd.http.request.max_chunk":"4096",
"tsd.http.show_stack_trace":"true",
"tsd.http.staticroot":"/usr/share/opentsdb/static/",
"tsd.mode":"ro",
"tsd.network.async_io":"true",
"tsd.network.bind":"0.0.0.0",
"tsd.network.keep_alive":"true",
"tsd.network.port":"hidden",
"tsd.network.reuse_address":"true",
"tsd.network.tcp_no_delay":"true",
"tsd.network.worker_threads":"",
"tsd.no_diediedie":"false",
"tsd.query.allow_simultaneous_duplicates":"true",
"tsd.query.enable_fuzzy_filter":"true",
"tsd.query.filter.expansion_limit":"4096",
"tsd.query.skip_unresolved_tagvs":"false",
"tsd.query.timeout":"0",
"tsd.rtpublisher.enable":"false",
"tsd.rtpublisher.plugin":"",
"tsd.search.enable":"false",
"tsd.search.plugin":"",
"tsd.startup.enable":"false",
"tsd.startup.plugin":"",
"tsd.stats.canonical":"false",
"tsd.storage.compaction.flush_interval":"10",
"tsd.storage.compaction.flush_speed":"2",
"tsd.storage.compaction.max_concurrent_flushes":"10000",
"tsd.storage.compaction.min_flush_threshold":"100",
"tsd.storage.enable_appends":"false",
"tsd.storage.enable_compaction":"false",
"tsd.storage.fix_duplicates":"true",
"tsd.storage.flush_interval":"1000",
"tsd.storage.hbase.data_table":"tsdb",
"tsd.storage.hbase.meta_table":"tsdb-meta",
"tsd.storage.hbase.prefetch_meta":"false",
"tsd.storage.hbase.scanner.maxNumRows":"128",
"tsd.storage.hbase.tree_table":"tsdb-tree",
"tsd.storage.hbase.uid_table":"tsdb-uid",
"tsd.storage.hbase.zk_basedir":"/hbase",
"tsd.storage.hbase.zk_quorum":"ip-<ip address>.ec2.internal",
"tsd.storage.repair_appends":"false",
"tsd.storage.salt.buckets":"7",
"tsd.storage.salt.width":"1",
"tsd.timeseriesfilter.enable":"false",
"tsd.uidfilter.enable":"false"}
Any general guidance for troubleshooting or performance tuning would be appreciated.