// StatisticsMetricCollector.java

// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements.  See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership.  The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License.  You may obtain a copy of the License at
//
//   http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied.  See the License for the
// specific language governing permissions and limitations
// under the License.

package org.apache.doris.statistics;

import org.apache.doris.catalog.Column;
import org.apache.doris.catalog.DatabaseIf;
import org.apache.doris.catalog.Env;
import org.apache.doris.catalog.OlapTable;
import org.apache.doris.catalog.TableIf;
import org.apache.doris.common.Pair;
import org.apache.doris.common.util.MasterDaemon;
import org.apache.doris.datasource.InternalCatalog;
import org.apache.doris.statistics.util.StatisticsUtil;

import org.apache.logging.log4j.LogManager;
import org.apache.logging.log4j.Logger;

import java.util.Set;
import java.util.concurrent.TimeUnit;
import java.util.stream.Collectors;

/**
 * Daemon thread to collect statistics related metrics.
 *
 * <p>On every run it walks the databases of the internal catalog (skipping those listed in
 * {@code StatisticConstants.SYSTEM_DBS}), inspects every {@link OlapTable} and counts tables and columns.
 * The counters of a finished run are published together as one immutable snapshot, so the getters,
 * which may be called from other threads, always report values that belong to the same run.
 */
public class StatisticsMetricCollector extends MasterDaemon {

    public static final Logger LOG = LogManager.getLogger(StatisticsMetricCollector.class);

    /** Period between two collection runs, in seconds. */
    public static final long INTERVAL = 300;

    /**
     * Counters of the most recently finished run; all zeros until the first run completes.
     * The reference is replaced as a whole, never mutated, so one volatile read yields a consistent view.
     */
    private volatile MetricSnapshot snapshot = new MetricSnapshot(0, 0, 0, 0, 0, 0);

    public StatisticsMetricCollector() {
        super("Statistics Metric Collector", TimeUnit.SECONDS.toMillis(INTERVAL));
    }

    /**
     * Recomputes all counters from the current catalog content and publishes them in a single step.
     *
     * <p>Failures are handled on a best-effort basis: an exception raised for one table or one database is
     * logged and the scan continues with the next one.
     */
    @Override
    protected void runAfterCatalogReady() {
        InternalCatalog catalog = Env.getCurrentInternalCatalog();
        AnalysisManager analysisManager = Env.getCurrentEnv().getAnalysisManager();
        int tmpUnhealthyTableCount = 0;
        int tmpUnhealthyColumnCount = 0;
        int tmpNotAnalyzedTableCount = 0;
        int tmpTotalTableCount = 0;
        int tmpTotalColumnCount = 0;
        int tmpEmptyTableCount = 0;
        for (DatabaseIf<? extends TableIf> db : catalog.getAllDbs()) {
            try {
                if (StatisticConstants.SYSTEM_DBS.contains(db.getFullName())) {
                    continue;
                }
                for (TableIf table : db.getTables()) {
                    try {
                        // Only OLAP tables take part in these metrics.
                        if (!(table instanceof OlapTable)) {
                            continue;
                        }
                        // Counted before the calls below, so a table that fails later is still part of the total.
                        tmpTotalTableCount += 1;
                        // Get all supported columns, including all indexes.
                        Set<String> columns = table.getSchemaAllIndexes(false)
                                .stream()
                                .filter(c -> !StatisticsUtil.isUnsupportedType(c.getType()))
                                .map(Column::getName)
                                .collect(Collectors.toSet());
                        tmpTotalColumnCount += columns.size();
                        if (table.getRowCount() == 0) {
                            tmpEmptyTableCount += 1;
                        }
                        // No stats status registered for the table means it is counted as not analyzed.
                        if (analysisManager.findTableStatsStatus(table.getId()) == null) {
                            tmpNotAnalyzedTableCount += 1;
                        }
                        // Get all unhealthy columns.
                        Set<Pair<String, String>> columnIndexPairs = table.getColumnIndexPairs(columns)
                                .stream().filter(p -> StatisticsUtil.needAnalyzeColumn(table, p))
                                .collect(Collectors.toSet());
                        if (!columnIndexPairs.isEmpty()) {
                            tmpUnhealthyTableCount += 1;
                            tmpUnhealthyColumnCount += columnIndexPairs.size();
                        }
                    } catch (Exception e) {
                        LOG.warn("Failed to get metrics for table {}. Reason {}", table.getName(), e.getMessage());
                    }
                }
            } catch (Exception e) {
                LOG.warn("Failed to get metrics for db {}. Reason {}", db.getFullName(), e.getMessage());
            }
        }
        // Single volatile write: readers see either the previous run or this one, never a mix of both.
        snapshot = new MetricSnapshot(tmpUnhealthyTableCount, tmpUnhealthyColumnCount, tmpNotAnalyzedTableCount,
                tmpTotalTableCount, tmpTotalColumnCount, tmpEmptyTableCount);
    }

    /**
     * @return number of OLAP tables that had at least one column flagged by
     *         {@code StatisticsUtil.needAnalyzeColumn} in the last run
     */
    public int getUnhealthyTableCount() {
        return snapshot.unhealthyTableCount;
    }

    /**
     * @return unhealthy tables as a percentage of all scanned OLAP tables, or 0 when no table was scanned
     */
    public double getUnhealthyTableRate() {
        // Read the reference once so numerator and denominator come from the same run.
        MetricSnapshot current = snapshot;
        return percentage(current.unhealthyTableCount, current.totalTableCount);
    }

    /**
     * @return number of column/index pairs flagged by {@code StatisticsUtil.needAnalyzeColumn} in the last run
     */
    public int getUnhealthyColumnCount() {
        return snapshot.unhealthyColumnCount;
    }

    /**
     * @return unhealthy columns as a percentage of all counted columns, or 0 when no column was counted
     */
    public double getUnhealthyColumnRate() {
        // Read the reference once so numerator and denominator come from the same run.
        MetricSnapshot current = snapshot;
        return percentage(current.unhealthyColumnCount, current.totalColumnCount);
    }

    /**
     * @return number of OLAP tables for which the analysis manager had no table stats status in the last run
     */
    public int getNotAnalyzedTableCount() {
        return snapshot.notAnalyzedTableCount;
    }

    /**
     * @return number of OLAP tables whose row count was 0 in the last run
     */
    public int getEmptyTableCount() {
        return snapshot.emptyTableCount;
    }

    /** Returns {@code part / total} as a percentage, or 0 when {@code total} is 0. */
    private static double percentage(int part, int total) {
        return total == 0 ? 0 : (double) part / total * 100;
    }

    /** Immutable set of counters produced by one collection run. */
    private static final class MetricSnapshot {
        private final int unhealthyTableCount;
        private final int unhealthyColumnCount;
        private final int notAnalyzedTableCount;
        private final int totalTableCount;
        private final int totalColumnCount;
        private final int emptyTableCount;

        private MetricSnapshot(int unhealthyTableCount, int unhealthyColumnCount, int notAnalyzedTableCount,
                int totalTableCount, int totalColumnCount, int emptyTableCount) {
            this.unhealthyTableCount = unhealthyTableCount;
            this.unhealthyColumnCount = unhealthyColumnCount;
            this.notAnalyzedTableCount = notAnalyzedTableCount;
            this.totalTableCount = totalTableCount;
            this.totalColumnCount = totalColumnCount;
            this.emptyTableCount = emptyTableCount;
        }
    }
}