Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[improvement](statistics)Skip auto analyze empty table. (#43865) #44045

Merged
merged 1 commit into from
Nov 16, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -219,6 +219,9 @@ public void createAnalysisJob(AnalyzeTblStmt stmt, boolean proxy) throws DdlExce
}
List<AnalysisInfo> jobs = new ArrayList<>();
autoCollector.createAnalyzeJobForTbl(stmt.getDb(), jobs, stmt.getTable());
if (jobs.isEmpty()) {
return;
}
AnalysisInfo job = autoCollector.getReAnalyzeRequiredPart(jobs.get(0));
if (job != null) {
Env.getCurrentEnv().getStatisticsAutoCollector().createSystemAnalysisJob(job);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -144,7 +144,6 @@ protected List<AnalysisInfo> constructAnalysisInfo(DatabaseIf<? extends TableIf>
} catch (Throwable t) {
LOG.warn("Failed to analyze table {}.{}.{}",
db.getCatalog().getName(), db.getFullName(), table.getName(), t);
continue;
}
}
return analysisInfos;
Expand Down Expand Up @@ -186,7 +185,19 @@ protected void createAnalyzeJobForTbl(DatabaseIf<? extends TableIf> db,
return;
}
}
long rowCount = StatisticsUtil.isEmptyTable(table, analysisMethod) ? 0 : table.getRowCount();
// We don't auto analyze empty tables, to avoid collecting all-zero stats.
// All-zero stats are more dangerous than unknown stats when the row count report is delayed.
AnalysisManager manager = Env.getServingEnv().getAnalysisManager();
TableStatsMeta tableStatsStatus = manager.findTableStatsStatus(table.getId());
long rowCount = table.getRowCount();
if (rowCount <= 0) {
LOG.info("Table {} is empty, remove its old stats and skip auto analyze it.", table.getName());
// Remove the table's old stats if exists.
if (tableStatsStatus != null && !tableStatsStatus.isColumnsStatsEmpty()) {
manager.dropStats(table);
}
return;
}
AnalysisInfo jobInfo = new AnalysisInfoBuilder()
.setJobId(Env.getCurrentEnv().getNextId())
.setCatalogId(db.getCatalog().getId())
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -242,4 +242,8 @@ protected void clearStaleIndexRowCount(OlapTable table) {
/**
 * Test-only helper: records {@code rowCount} for {@code indexId} in
 * {@code indexesRowCount}, replacing any value already stored for that index.
 *
 * @param indexId  id of the index whose row count is being set
 * @param rowCount row count to store for the index
 */
protected void addIndexRowForTest(long indexId, long rowCount) {
indexesRowCount.put(indexId, rowCount);
}

/**
 * Tells whether this table stats meta currently holds no column stats entries.
 *
 * @return {@code true} if {@code colNameToColStatsMeta} is {@code null} or empty,
 *         {@code false} otherwise
 */
public boolean isColumnsStatsEmpty() {
    // A missing container is treated the same as an empty one.
    if (colNameToColStatsMeta == null) {
        return true;
    }
    return colNameToColStatsMeta.isEmpty();
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -142,6 +142,11 @@ public List<Column> getSchemaAllIndexes(boolean full) {
columns.add(new Column("c2", PrimitiveType.HLL));
return columns;
}

// Mocked row count: always reports a single row.
// NOTE(review): presumably needed so the mocked table is not treated as empty,
// since auto analyze skips tables whose row count is <= 0 — confirm.
@Mock
public long getRowCount() {
return 1;
}
};
StatisticsAutoCollector saa = new StatisticsAutoCollector();
List<AnalysisInfo> analysisInfoList = saa.constructAnalysisInfo(new Database(1, "anydb"));
Expand Down Expand Up @@ -397,6 +402,11 @@ public List<Long> getMvColumnIndexIds(String columnName) {
objects.add(-1L);
return objects;
}

// Mocked row count: always reports a single row.
// NOTE(review): presumably needed so the mocked table is not treated as empty,
// since auto analyze skips tables whose row count is <= 0 — confirm.
@Mock
public long getRowCount() {
return 1;
}
};

new MockUp<StatisticsUtil>() {
Expand Down Expand Up @@ -469,6 +479,11 @@ public List<Long> getMvColumnIndexIds(String columnName) {
objects.add(-1L);
return objects;
}

// Mocked row count: always reports a single row.
// NOTE(review): presumably needed so the mocked table is not treated as empty,
// since auto analyze skips tables whose row count is <= 0 — confirm.
@Mock
public long getRowCount() {
return 1;
}
};

new MockUp<StatisticsUtil>() {
Expand Down
33 changes: 33 additions & 0 deletions regression-test/suites/statistics/test_analyze_mv.groovy
Original file line number Diff line number Diff line change
Expand Up @@ -689,6 +689,18 @@ suite("test_analyze_mv") {
assertEquals("0", result_row[0][3])
assertEquals("-1", result_row[0][4])

// ** Embedded test for skip auto analyze when table is empty
sql """analyze table mvTestDup properties ("use.auto.analyzer" = "true")"""
def empty_test = sql """show auto analyze mvTestDup"""
assertEquals(0, empty_test.size())
empty_test = sql """show column stats mvTestDup"""
assertEquals(0, empty_test.size())
// ** End of embedded test

sql """analyze table mvTestDup with sync"""
empty_test = sql """show column stats mvTestDup"""
assertEquals(12, empty_test.size())

for (int i = 0; i < 120; i++) {
result_row = sql """show index stats mvTestDup mv3"""
logger.info("mv3 stats: " + result_row)
Expand All @@ -703,6 +715,27 @@ suite("test_analyze_mv") {
assertEquals("mv3", result_row[0][1])
assertEquals("0", result_row[0][3])
assertEquals("0", result_row[0][4])

// ** Embedded test for skip auto analyze when table is empty again
sql """analyze table mvTestDup properties ("use.auto.analyzer" = "true")"""
empty_test = sql """show auto analyze mvTestDup"""
assertEquals(0, empty_test.size())
empty_test = sql """show column stats mvTestDup"""
// Poll until the asynchronous stats deletion has finished: re-query up to
// 100 times, sleeping 1 second between attempts. Leave the loop as soon as
// no column stats remain; the assertion after the loop checks the final result.
for (int i = 0; i < 100; i++) {
    empty_test = sql """show column stats mvTestDup"""
    if (empty_test.size() == 0) {
        // Old stats are gone, no need to wait any longer.
        break
    }
    logger.info("async delete is not finished yet.")
    Thread.sleep(1000)
}
assertEquals(0, empty_test.size())
// ** End of embedded test

sql """analyze table mvTestDup with sync"""
empty_test = sql """show column stats mvTestDup"""
assertEquals(12, empty_test.size())

sql """insert into mvTestDup values (1, 2, 3, 4, 5), (1, 2, 3, 4, 5), (10, 20, 30, 40, 50), (10, 20, 30, 40, 50), (100, 200, 300, 400, 500), (1001, 2001, 3001, 4001, 5001);"""
result_row = sql """show index stats mvTestDup mv3"""
assertEquals(1, result_row.size())
Expand Down
Loading