Skip to content

Commit

Permalink
[AMORO-405]: Added overview page in AMS dashboard (#3031)
Browse files Browse the repository at this point in the history
* add overview page

* Update the style of SingleDataCard MultipleDataCard

* Implementing cards basic styles

* add OverviewController

* get sum of tables sizes

* add pieChartCard、TableHealthCard、UserHistoryCard

* update the visual design of the overview page

* format code

* add mock data for Optimizing Status, Summary Cards, Table Format

* get overview summary

* add overview optimizing status and overview format api

* fix memory unit

* fix imports

* add listTableMetas method to TableService

* front-end of the UnhealthTablesCard and OperationsCard

* Formatting Code,i18

* add unhealthTables and latestOperations API

* update unhealth tables api and format code

* restore pnpm-lock.yaml

* Optimize and clean up code

* implements OverviewMetricsReporter

* move OverviewMetricsReporter to ams-server

* fix unit and i18 bug

* fix unit bug

* fix overview getTableFormat bug

* add resource api

* added idle&committing for OptimizerGroupMetrics

* update design for overview page

* update resource usage api

* implement overviewSummary/dataSize api

* fixed unit bug

* move overview page

* add overview cache unit test

* update format and i18n

* show health score on overview page

* Remove introduce page,and format code

---------

Co-authored-by: ZhouJinsong <[email protected]>
  • Loading branch information
MarigWeizhi and zhoujinsong authored Sep 12, 2024
1 parent d4ea2fa commit f541d6f
Show file tree
Hide file tree
Showing 33 changed files with 1,935 additions and 485 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -39,6 +39,7 @@
import org.apache.amoro.server.dashboard.controller.HealthCheckController;
import org.apache.amoro.server.dashboard.controller.LoginController;
import org.apache.amoro.server.dashboard.controller.OptimizerController;
import org.apache.amoro.server.dashboard.controller.OverviewController;
import org.apache.amoro.server.dashboard.controller.PlatformFileInfoController;
import org.apache.amoro.server.dashboard.controller.SettingController;
import org.apache.amoro.server.dashboard.controller.TableController;
Expand Down Expand Up @@ -82,6 +83,7 @@ public class DashboardServer {
private final TableController tableController;
private final TerminalController terminalController;
private final VersionController versionController;
private final OverviewController overviewController;

private final String authType;
private final String basicAuthUser;
Expand All @@ -103,6 +105,7 @@ public DashboardServer(
this.tableController = new TableController(tableService, tableDescriptor, serviceConfig);
this.terminalController = new TerminalController(terminalManager);
this.versionController = new VersionController();
this.overviewController = new OverviewController();

this.authType = serviceConfig.get(AmoroManagementConf.HTTP_SERVER_REST_AUTH_TYPE);
this.basicAuthUser = serviceConfig.get(AmoroManagementConf.ADMIN_USERNAME);
Expand Down Expand Up @@ -327,6 +330,17 @@ private EndpointGroup apiGroup() {

// version api
get("/versionInfo", versionController::getVersionInfo);

// overview apis
path(
"/overview",
() -> {
get("/summary", overviewController::getSummary);
get("/resource", overviewController::getResourceUsageHistory);
get("/optimizing", overviewController::getOptimizingStatus);
get("/dataSize", overviewController::getDataSizeHistory);
get("/top", overviewController::getTopTables);
});
};
}

Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,302 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.amoro.server.dashboard;

import static org.apache.amoro.server.optimizing.OptimizerGroupMetrics.OPTIMIZER_GROUP_COMMITTING_TABLES;
import static org.apache.amoro.server.optimizing.OptimizerGroupMetrics.OPTIMIZER_GROUP_EXECUTING_TABLES;
import static org.apache.amoro.server.optimizing.OptimizerGroupMetrics.OPTIMIZER_GROUP_IDLE_TABLES;
import static org.apache.amoro.server.optimizing.OptimizerGroupMetrics.OPTIMIZER_GROUP_MEMORY_BYTES_ALLOCATED;
import static org.apache.amoro.server.optimizing.OptimizerGroupMetrics.OPTIMIZER_GROUP_PENDING_TABLES;
import static org.apache.amoro.server.optimizing.OptimizerGroupMetrics.OPTIMIZER_GROUP_PLANING_TABLES;
import static org.apache.amoro.server.optimizing.OptimizerGroupMetrics.OPTIMIZER_GROUP_THREADS;
import static org.apache.amoro.server.table.TableSummaryMetrics.TABLE_SUMMARY_HEALTH_SCORE;
import static org.apache.amoro.server.table.TableSummaryMetrics.TABLE_SUMMARY_TOTAL_FILES;
import static org.apache.amoro.server.table.TableSummaryMetrics.TABLE_SUMMARY_TOTAL_FILES_SIZE;

import org.apache.amoro.metrics.Counter;
import org.apache.amoro.metrics.Gauge;
import org.apache.amoro.metrics.Metric;
import org.apache.amoro.metrics.MetricDefine;
import org.apache.amoro.metrics.MetricKey;
import org.apache.amoro.metrics.MetricSet;
import org.apache.amoro.server.dashboard.model.OverviewDataSizeItem;
import org.apache.amoro.server.dashboard.model.OverviewResourceUsageItem;
import org.apache.amoro.server.dashboard.model.OverviewTopTableItem;
import org.apache.amoro.shade.guava32.com.google.common.collect.ImmutableList;
import org.apache.amoro.shade.guava32.com.google.common.collect.Maps;
import org.apache.amoro.shade.guava32.com.google.common.collect.Sets;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.util.ArrayList;
import java.util.Deque;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentLinkedDeque;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.atomic.AtomicLong;
import java.util.function.Function;
import java.util.stream.Collectors;

public class OverviewCache {

public static final String STATUS_PENDING = "Pending";
public static final String STATUS_PLANING = "Planing";
public static final String STATUS_EXECUTING = "Executing";
public static final String STATUS_IDLE = "Idle";
public static final String STATUS_COMMITTING = "Committing";

private static final Logger LOG = LoggerFactory.getLogger(OverviewCache.class);

private volatile List<OverviewTopTableItem> allTopTableItem = new ArrayList<>();
private final Map<String, Long> optimizingStatusCountMap = new ConcurrentHashMap<>();
private final ConcurrentLinkedDeque<OverviewResourceUsageItem> resourceUsageHistory =
new ConcurrentLinkedDeque<>();
private final ConcurrentLinkedDeque<OverviewDataSizeItem> dataSizeHistory =
new ConcurrentLinkedDeque<>();
private final AtomicInteger totalCatalog = new AtomicInteger();
private final AtomicLong totalDataSize = new AtomicLong();
private final AtomicInteger totalTableCount = new AtomicInteger();
private final AtomicInteger totalCpu = new AtomicInteger();
private final AtomicLong totalMemory = new AtomicLong();

private MetricSet metricSet;
private int maxRecordCount;
private static volatile OverviewCache INSTANCE;

private OverviewCache() {}

/** @return Get the singleton object. */
public static OverviewCache getInstance() {
if (INSTANCE == null) {
synchronized (OverviewCache.class) {
if (INSTANCE == null) {
INSTANCE = new OverviewCache();
}
}
}
return INSTANCE;
}

public void initialize(int maxRecordCount, MetricSet globalMetricSet) {
this.maxRecordCount = maxRecordCount;
this.metricSet = globalMetricSet;
}

public List<OverviewTopTableItem> getAllTopTableItem() {
return ImmutableList.copyOf(allTopTableItem);
}

public int getTotalCatalog() {
return totalCatalog.get();
}

public int getTotalTableCount() {
return totalTableCount.get();
}

public long getTotalDataSize() {
return totalDataSize.get();
}

public int getTotalCpu() {
return totalCpu.get();
}

public long getTotalMemory() {
return totalMemory.get();
}

public List<OverviewResourceUsageItem> getResourceUsageHistory(long startTime) {
return resourceUsageHistory.stream()
.filter(item -> item.getTs() >= startTime)
.collect(Collectors.toList());
}

public List<OverviewDataSizeItem> getDataSizeHistory(long startTime) {
return dataSizeHistory.stream()
.filter(item -> item.getTs() >= startTime)
.collect(Collectors.toList());
}

public Map<String, Long> getOptimizingStatus() {
return optimizingStatusCountMap;
}

public void refresh() {
long start = System.currentTimeMillis();
LOG.info("Updating overview cache");
try {
// Already registered metrics may change,
// so the metricDefineMap needs to be recalculated at each refresh
Map<MetricDefine, List<MetricKey>> metricDefineMap =
metricSet.getMetrics().keySet().stream()
.collect(
Collectors.groupingBy(
MetricKey::getDefine,
Collectors.mapping(Function.identity(), Collectors.toList())));

updateResourceUsage(start, metricDefineMap);
updateTableDetail(start, metricDefineMap);
updateOptimizingStatus(metricDefineMap);

} catch (Exception e) {
LOG.error("OverviewRefresher error", e);
} finally {
long end = System.currentTimeMillis();
LOG.info("Refresher overview cache took {} ms.", end - start);
}
}

private void updateResourceUsage(long ts, Map<MetricDefine, List<MetricKey>> metricDefineMap) {
int optimizerGroupThreadCount =
(int) sumMetricValuesByDefine(metricDefineMap, OPTIMIZER_GROUP_THREADS);
long optimizerGroupMemoryBytes =
sumMetricValuesByDefine(metricDefineMap, OPTIMIZER_GROUP_MEMORY_BYTES_ALLOCATED);

this.totalCpu.set(optimizerGroupThreadCount);
this.totalMemory.set(optimizerGroupMemoryBytes);
addAndCheck(
new OverviewResourceUsageItem(ts, optimizerGroupThreadCount, optimizerGroupMemoryBytes));
}

private void updateTableDetail(long ts, Map<MetricDefine, List<MetricKey>> metricDefineMap) {
Map<String, OverviewTopTableItem> topTableItemMap = Maps.newHashMap();
Set<String> allCatalogs = Sets.newHashSet();
Map<MetricKey, Metric> registeredMetrics = metricSet.getMetrics();
long totalTableSize = 0L;

// table size
List<MetricKey> metricKeys = metricDefineMap.get(TABLE_SUMMARY_TOTAL_FILES_SIZE);
for (MetricKey metricKey : metricKeys) {
String tableName = fullTableName(metricKey);
allCatalogs.add(catalog(metricKey));
OverviewTopTableItem tableItem =
topTableItemMap.computeIfAbsent(tableName, ignore -> new OverviewTopTableItem(tableName));
long tableSize = covertValue(registeredMetrics.get(metricKey));
tableItem.setTableSize(tableSize);
totalTableSize += tableSize;
}

// file count
metricKeys = metricDefineMap.get(TABLE_SUMMARY_TOTAL_FILES);
for (MetricKey metricKey : metricKeys) {
String tableName = fullTableName(metricKey);
allCatalogs.add(catalog(metricKey));
OverviewTopTableItem tableItem =
topTableItemMap.computeIfAbsent(tableName, ignore -> new OverviewTopTableItem(tableName));
int fileCount = (int) covertValue(registeredMetrics.get(metricKey));
tableItem.setFileCount(fileCount);
tableItem.setAverageFileSize(fileCount == 0 ? 0 : tableItem.getTableSize() / fileCount);
}

// health score
metricKeys = metricDefineMap.get(TABLE_SUMMARY_HEALTH_SCORE);
for (MetricKey metricKey : metricKeys) {
String tableName = fullTableName(metricKey);
allCatalogs.add(catalog(metricKey));
OverviewTopTableItem tableItem =
topTableItemMap.computeIfAbsent(tableName, ignore -> new OverviewTopTableItem(tableName));
int healthScore = (int) covertValue(registeredMetrics.get(metricKey));
tableItem.setHealthScore(healthScore);
}

this.totalDataSize.set(totalTableSize);
this.totalCatalog.set(allCatalogs.size());
this.totalTableCount.set(metricKeys.size());
this.allTopTableItem = new ArrayList<>(topTableItemMap.values());
addAndCheck(new OverviewDataSizeItem(ts, totalTableSize));
}

private void updateOptimizingStatus(Map<MetricDefine, List<MetricKey>> metricDefineMap) {
optimizingStatusCountMap.put(
STATUS_PENDING, sumMetricValuesByDefine(metricDefineMap, OPTIMIZER_GROUP_PENDING_TABLES));
optimizingStatusCountMap.put(
STATUS_PLANING, sumMetricValuesByDefine(metricDefineMap, OPTIMIZER_GROUP_PLANING_TABLES));
optimizingStatusCountMap.put(
STATUS_EXECUTING,
sumMetricValuesByDefine(metricDefineMap, OPTIMIZER_GROUP_EXECUTING_TABLES));
optimizingStatusCountMap.put(
STATUS_IDLE, sumMetricValuesByDefine(metricDefineMap, OPTIMIZER_GROUP_IDLE_TABLES));
optimizingStatusCountMap.put(
STATUS_COMMITTING,
sumMetricValuesByDefine(metricDefineMap, OPTIMIZER_GROUP_COMMITTING_TABLES));
}

private void addAndCheck(OverviewDataSizeItem dataSizeItem) {
dataSizeHistory.add(dataSizeItem);
checkSize(dataSizeHistory);
}

private void addAndCheck(OverviewResourceUsageItem resourceUsageItem) {
resourceUsageHistory.add(resourceUsageItem);
checkSize(resourceUsageHistory);
}

private <T> void checkSize(Deque<T> deque) {
if (deque.size() > maxRecordCount) {
deque.poll();
}
}

private String fullTableName(MetricKey metricKey) {
return catalog(metricKey)
.concat(".")
.concat(database(metricKey))
.concat(".")
.concat(table(metricKey));
}

private String catalog(MetricKey metricKey) {
return metricKey.valueOfTag("catalog");
}

private String database(MetricKey metricKey) {
return metricKey.valueOfTag("database");
}

private String table(MetricKey metricKey) {
return metricKey.valueOfTag("table");
}

private long sumMetricValuesByDefine(
Map<MetricDefine, List<MetricKey>> metricDefineMap, MetricDefine metricDefine) {
List<MetricKey> metricKeys = metricDefineMap.get(metricDefine);
if ((metricKeys == null)) {
return 0;
}
return metricKeys.stream()
.map(metricKey -> covertValue(metricSet.getMetrics().get(metricKey)))
.mapToLong(Long::longValue)
.sum();
}

private long covertValue(Metric metric) {
if (metric instanceof Counter) {
return ((Counter) metric).getCount();
} else if (metric instanceof Gauge) {
return ((Gauge<?>) metric).getValue().longValue();
} else {
throw new IllegalStateException(
"unknown metric implement class:" + metric.getClass().getName());
}
}
}
Loading

0 comments on commit f541d6f

Please sign in to comment.