Skip to content

Commit bd750cf

Browse files
authored
Merge branch 'branch-2.0' into fix_hudi_scan_lock
2 parents 791c21c + f20aff5 commit bd750cf

File tree

9 files changed

+77
-6
lines changed

9 files changed

+77
-6
lines changed

be/src/common/daemon.cpp

+1
Original file line numberDiff line numberDiff line change
@@ -409,6 +409,7 @@ static void init_doris_metrics(const std::vector<StorePath>& store_paths) {
409409
void signal_handler(int signal) {
410410
if (signal == SIGINT || signal == SIGTERM) {
411411
k_doris_exit = true;
412+
k_doris_start = false;
412413
LOG(INFO) << "doris start to exit";
413414
}
414415
}

be/src/common/daemon.h

+1
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,7 @@ namespace doris {
2727

2828
struct StorePath;
2929
inline bool k_doris_exit = false;
30+
inline bool k_doris_start = false;
3031

3132
class Daemon {
3233
public:

be/src/runtime/thread_context.h

+5-4
Original file line numberDiff line numberDiff line change
@@ -100,6 +100,7 @@ class MemTracker;
100100
class RuntimeState;
101101

102102
extern bool k_doris_exit;
103+
extern bool k_doris_start;
103104
extern bthread_key_t btls_key;
104105

105106
// Using gcc11 compiles thread_local variable on lower versions of GLIBC will report an error,
@@ -388,17 +389,17 @@ class AddThreadMemTrackerConsumer {
388389
// which is different from the previous behavior.
389390
#define CONSUME_MEM_TRACKER(size) \
390391
do { \
391-
if (doris::thread_context_ptr.init) { \
392+
if (doris::k_doris_start && doris::thread_context_ptr.init) { \
392393
doris::thread_context()->consume_memory(size); \
393-
} else if (doris::ExecEnv::GetInstance()->initialized()) { \
394+
} else if (doris::k_doris_start && doris::ExecEnv::GetInstance()->initialized()) { \
394395
doris::ExecEnv::GetInstance()->orphan_mem_tracker_raw()->consume_no_update_peak(size); \
395396
} \
396397
} while (0)
397398
#define RELEASE_MEM_TRACKER(size) \
398399
do { \
399-
if (doris::thread_context_ptr.init) { \
400+
if (doris::k_doris_start && doris::thread_context_ptr.init) { \
400401
doris::thread_context()->consume_memory(-size); \
401-
} else if (doris::ExecEnv::GetInstance()->initialized()) { \
402+
} else if (doris::k_doris_start && doris::ExecEnv::GetInstance()->initialized()) { \
402403
doris::ExecEnv::GetInstance()->orphan_mem_tracker_raw()->consume_no_update_peak( \
403404
-size); \
404405
} \

be/src/service/doris_main.cpp

+2
Original file line numberDiff line numberDiff line change
@@ -82,6 +82,7 @@ int __llvm_profile_write_file();
8282

8383
namespace doris {
8484
extern bool k_doris_exit;
85+
extern bool k_doris_start;
8586

8687
static void thrift_output(const char* x) {
8788
LOG(WARNING) << "thrift internal message: " << x;
@@ -463,6 +464,7 @@ int main(int argc, char** argv) {
463464

464465
// init exec env
465466
auto exec_env = doris::ExecEnv::GetInstance();
467+
doris::k_doris_start = true;
466468
doris::ExecEnv::init(exec_env, paths);
467469
doris::TabletSchemaCache::create_global_schema_cache();
468470

fe/fe-core/src/main/java/org/apache/doris/statistics/AnalysisManager.java

+3
Original file line numberDiff line numberDiff line change
@@ -219,6 +219,9 @@ public void createAnalysisJob(AnalyzeTblStmt stmt, boolean proxy) throws DdlExce
219219
}
220220
List<AnalysisInfo> jobs = new ArrayList<>();
221221
autoCollector.createAnalyzeJobForTbl(stmt.getDb(), jobs, stmt.getTable());
222+
if (jobs.isEmpty()) {
223+
return;
224+
}
222225
AnalysisInfo job = autoCollector.getReAnalyzeRequiredPart(jobs.get(0));
223226
if (job != null) {
224227
Env.getCurrentEnv().getStatisticsAutoCollector().createSystemAnalysisJob(job);

fe/fe-core/src/main/java/org/apache/doris/statistics/StatisticsAutoCollector.java

+13-2
Original file line numberDiff line numberDiff line change
@@ -144,7 +144,6 @@ protected List<AnalysisInfo> constructAnalysisInfo(DatabaseIf<? extends TableIf>
144144
} catch (Throwable t) {
145145
LOG.warn("Failed to analyze table {}.{}.{}",
146146
db.getCatalog().getName(), db.getFullName(), table.getName(), t);
147-
continue;
148147
}
149148
}
150149
return analysisInfos;
@@ -186,7 +185,19 @@ protected void createAnalyzeJobForTbl(DatabaseIf<? extends TableIf> db,
186185
return;
187186
}
188187
}
189-
long rowCount = StatisticsUtil.isEmptyTable(table, analysisMethod) ? 0 : table.getRowCount();
188+
// We don't auto analyze empty table to avoid all 0 stats.
189+
// Because all 0 is more dangerous than unknown stats when row count report is delayed.
190+
AnalysisManager manager = Env.getServingEnv().getAnalysisManager();
191+
TableStatsMeta tableStatsStatus = manager.findTableStatsStatus(table.getId());
192+
long rowCount = table.getRowCount();
193+
if (rowCount <= 0) {
194+
LOG.info("Table {} is empty, remove its old stats and skip auto analyze it.", table.getName());
195+
// Remove the table's old stats if exists.
196+
if (tableStatsStatus != null && !tableStatsStatus.isColumnsStatsEmpty()) {
197+
manager.dropStats(table);
198+
}
199+
return;
200+
}
190201
AnalysisInfo jobInfo = new AnalysisInfoBuilder()
191202
.setJobId(Env.getCurrentEnv().getNextId())
192203
.setCatalogId(db.getCatalog().getId())

fe/fe-core/src/main/java/org/apache/doris/statistics/TableStatsMeta.java

+4
Original file line numberDiff line numberDiff line change
@@ -242,4 +242,8 @@ protected void clearStaleIndexRowCount(OlapTable table) {
242242
protected void addIndexRowForTest(long indexId, long rowCount) {
243243
indexesRowCount.put(indexId, rowCount);
244244
}
245+
246+
public boolean isColumnsStatsEmpty() {
247+
return colNameToColStatsMeta == null || colNameToColStatsMeta.isEmpty();
248+
}
245249
}

fe/fe-core/src/test/java/org/apache/doris/statistics/StatisticsAutoCollectorTest.java

+15
Original file line numberDiff line numberDiff line change
@@ -142,6 +142,11 @@ public List<Column> getSchemaAllIndexes(boolean full) {
142142
columns.add(new Column("c2", PrimitiveType.HLL));
143143
return columns;
144144
}
145+
146+
@Mock
147+
public long getRowCount() {
148+
return 1;
149+
}
145150
};
146151
StatisticsAutoCollector saa = new StatisticsAutoCollector();
147152
List<AnalysisInfo> analysisInfoList = saa.constructAnalysisInfo(new Database(1, "anydb"));
@@ -397,6 +402,11 @@ public List<Long> getMvColumnIndexIds(String columnName) {
397402
objects.add(-1L);
398403
return objects;
399404
}
405+
406+
@Mock
407+
public long getRowCount() {
408+
return 1;
409+
}
400410
};
401411

402412
new MockUp<StatisticsUtil>() {
@@ -469,6 +479,11 @@ public List<Long> getMvColumnIndexIds(String columnName) {
469479
objects.add(-1L);
470480
return objects;
471481
}
482+
483+
@Mock
484+
public long getRowCount() {
485+
return 1;
486+
}
472487
};
473488

474489
new MockUp<StatisticsUtil>() {

regression-test/suites/statistics/test_analyze_mv.groovy

+33
Original file line numberDiff line numberDiff line change
@@ -689,6 +689,18 @@ suite("test_analyze_mv") {
689689
assertEquals("0", result_row[0][3])
690690
assertEquals("-1", result_row[0][4])
691691

692+
// ** Embedded test for skip auto analyze when table is empty
693+
sql """analyze table mvTestDup properties ("use.auto.analyzer" = "true")"""
694+
def empty_test = sql """show auto analyze mvTestDup"""
695+
assertEquals(0, empty_test.size())
696+
empty_test = sql """show column stats mvTestDup"""
697+
assertEquals(0, empty_test.size())
698+
// ** End of embedded test
699+
700+
sql """analyze table mvTestDup with sync"""
701+
empty_test = sql """show column stats mvTestDup"""
702+
assertEquals(12, empty_test.size())
703+
692704
for (int i = 0; i < 120; i++) {
693705
result_row = sql """show index stats mvTestDup mv3"""
694706
logger.info("mv3 stats: " + result_row)
@@ -703,6 +715,27 @@ suite("test_analyze_mv") {
703715
assertEquals("mv3", result_row[0][1])
704716
assertEquals("0", result_row[0][3])
705717
assertEquals("0", result_row[0][4])
718+
719+
// ** Embedded test for skip auto analyze when table is empty again
720+
sql """analyze table mvTestDup properties ("use.auto.analyzer" = "true")"""
721+
empty_test = sql """show auto analyze mvTestDup"""
722+
assertEquals(0, empty_test.size())
723+
empty_test = sql """show column stats mvTestDup"""
724+
for (int i = 0; i < 100; i++) {
725+
empty_test = sql """show column stats mvTestDup"""
726+
if (empty_test.size() != 0) {
727+
logger.info("async delete is not finished yet.")
728+
Thread.sleep(1000)
729+
}
730+
break
731+
}
732+
assertEquals(0, empty_test.size())
733+
// ** End of embedded test
734+
735+
sql """analyze table mvTestDup with sync"""
736+
empty_test = sql """show column stats mvTestDup"""
737+
assertEquals(12, empty_test.size())
738+
706739
sql """insert into mvTestDup values (1, 2, 3, 4, 5), (1, 2, 3, 4, 5), (10, 20, 30, 40, 50), (10, 20, 30, 40, 50), (100, 200, 300, 400, 500), (1001, 2001, 3001, 4001, 5001);"""
707740
result_row = sql """show index stats mvTestDup mv3"""
708741
assertEquals(1, result_row.size())

0 commit comments

Comments
 (0)