diff --git a/.nojekyll b/.nojekyll new file mode 100644 index 0000000..e69de29 diff --git a/README.md b/README.md index ce9534c..6e29b91 100644 --- a/README.md +++ b/README.md @@ -1,3 +1,5 @@ +Visit **[dbhammer.github.io](https://dbhammer.github.io)** 🚀 +

DBHammer

Lab Website Template diff --git a/_cite/.cache/cache.db b/_cite/.cache/cache.db index 13e939b..fd5a713 100644 Binary files a/_cite/.cache/cache.db and b/_cite/.cache/cache.db differ diff --git a/_config.yaml b/_config.yaml index 42aeeba..7f67a69 100644 --- a/_config.yaml +++ b/_config.yaml @@ -16,8 +16,8 @@ links: orcid: 0000-0002-5182-2093 google-scholar: iJtZsaQAAAAJ github: dbhammer - twitter: YourLabHandle - youtube: YourLabChannel + # twitter: YourLabHandle + # youtube: YourLabChannel ### jekyll settings diff --git a/_data/citations.yaml b/_data/citations.yaml index 524a6d3..0e483e3 100644 --- a/_data/citations.yaml +++ b/_data/citations.yaml @@ -1,1168 +1,247 @@ -- id: "Hyper: Hybrid Physical Design Advisor with Multi-agent Reinforcement Learning" - manual: true - title: "Hyper: Hybrid Physical Design Advisor with Multi-agent Reinforcement Learning" - link: - authors: - - Zhicheng Pan - - Y Zhang - - Chengcheng Yang - - A Ghazal - - Rong Zhang - - Huiqi Hu - - X Wu - - Y Dong - - Xuan Zhou - publisher: IEEE International Conference on Data Engineering (ICDE) - date: '2025-01-01' -- id: "Artemis: A Customizable Workload Generation Toolkit for Benchmarking Cardinality Estimation " - manual: true - title: "Artemis: A Customizable Workload Generation Toolkit for Benchmarking Cardinality Estimation " - link: - authors: - - Zirui Hu - - Rong Zhang - - Chengcheng Yang - - Xuan Zhou - - Quanqing Xu - - Chuanhui Yang - publisher: IEEE International Conference on Data Engineering (ICDE) - date: '2025-01-01' -- id: "Benchmarking Distributed Transactional Database Systems" - manual: true - title: "Benchmarking Distributed Transactional Database Systems" - link: none - authors: - - Hailin He - - Siyang Weng - - Huidong Zhang - - Rong Zhang - - Xuan Zhou - publisher: BenchCouncil Transactions on Benchmarks, Standards and Evaluations - date: '2024-10-01' -- id: "DBStorm: Generating Various Effective Workloads for Testing Isolation Levels" - manual: true - title: "DBStorm: 
Generating Various Effective Workloads for Testing Isolation Levels" - link: https://2024.issta.org/details/issta-2024-papers/61/DBStorm-Generating-Various-Effective-Workloads-for-Testing-Isolation-Levels - authors: - - Keqiang Li - - Siyang Weng - - Lyu Ni - - Chengcheng Yang - - Rong Zhang - - Xuan Zhou - - Aoying Zhou - publisher: International Symposium on Software Testing and Analysis (ISSTA) - date: '2024-07-16' -- id: "Mirage: Generating Enormous Databases for Complex Workloads" - manual: true - title: "Mirage: Generating Enormous Databases for Complex Workloads" - link: https://www.computer.org/csdl/proceedings-article/icde/2024/171500d989/1YOtBpuCaTS - authors: - - Qingshuai Wang - - Hao Li - - Zirui Hu - - Rong Zhang - - Chengcheng Yang - - Peng Cai - - Xuan Zhou - - Aoying Zhou - publisher: IEEE International Conference on Data Engineering (ICDE) - date: '2024-03-20' -- id: "Functionality-Aware Database Tuning via Multi-Task Learning" - manual: true - title: "Functionality-Aware Database Tuning via Multi-Task Learning" - authors: - - Zhongwei Yue - - Shujian Peng - - Peng Cai - - Xuan Zhou - - Huiqi Hu - - Rong Zhang - - Quanqing Xu - - Chuanhui Yang - publisher: IEEE International Conference on Data Engineering (ICDE) - date: '2024-03-19' -- id: "SPQO: Learning to Safely Reuse Cached Plans for Dynamic Workloads" - manual: true - title: "SPQO: Learning to Safely Reuse Cached Plans for Dynamic Workloads" - authors: - - Sijia Li - - Peng Cai - - Yiqi Shen - - Huiqi Hu - - Rong Zhang - - Xuan Zhou - - Quanqing Xu - - Chuanhui Yang - publisher: Database Systems for Advanced Applications (DASFAA) - date: '2024-03-17' -- id: "Touchstone+ : Query Aware Database Generation for Match Operators" - manual: true - title: "Touchstone+ : Query Aware Database Generation for Match Operators" - link: https://link.springer.com/chapter/10.1007/978-981-97-5552-3_18 - authors: - - Hao Li - - Qingshuai Wang - - Zirui Hu - - Xuhua Huang - - Lv Ni - - Rong Zhang - - Xuan Zhou - 
- Quanqing Xu - publisher: Database Systems for Advanced Applications (DASFAA) - date: '2024-03-18' -- id: 'Lauca: A Workload Duplicator for Benchmarking Transactional Database Performance' - manual: true - title: 'Lauca: A Workload Duplicator for Benchmarking Transactional Database Performance' - link: https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=&arnumber=10416761 - authors: - - Siyang Weng - - Qingshuai Wang - - Luyi Qu - - Rong Zhang - - Peng cai - - Weining Qian - - Aoying Zhou - publisher: IEEE Transactions on Knowledge and Data Engineering (TKDE) - date: '2024-02-21' -- id: 'Leopard: A General Test Suite for Isolation Level Verification' - manual: true - title: 'Leopard: A General Test Suite for Isolation Level Verification' - link: https://www.cidrdb.org/cidr2024/papers/p44-liu.pdf - authors: - - Peiyuan Liu - - Siyang Weng - - Keqiang Li - - Lyu Ni - - Chengcheng Yang - - Rong Zhang - - Weining Qian - - Dian Qiao - publisher: International Conference on Innovative Data Systems Research (CIDR) - date: '2024-01-17' -- id: 'Dike: A Benchmark Suite for Distributed Transactional Databases' - manual: true - title: 'Dike: A Benchmark Suite for Distributed Transactional Databases' - link: https://dl.acm.org/doi/abs/10.1145/3555041.3589710 - authors: - - Huidong Zhang - - Luyi Qu - - Qingshuai Wang - - Rong Zhang - - Peng Cai - - Quanqing Xu - - Zhifeng Yang - - Chuanhui Yang - publisher: ACM SIGMOD/PODS International Conference on Management of Data (SIGMOD) - date: '2023-01-01' -- id: 'Workload-Aware Log-Structured Merge Key-Value Store for NVM-SSD Hybrid Storage' - manual: true - title: 'Workload-Aware Log-Structured Merge Key-Value Store for NVM-SSD Hybrid Storage' - link: https://ieeexplore.ieee.org/document/10184519 - authors: - - Lixiang Chen - - Ruihao Chen - - Chengcheng Yang - - Yuxing Han - - Rong Zhang - - Xuan Zhou - - Peiquan Jin - - Weining Qian - publisher: IEEE International Conference on Data Engineering (ICDE) - date: '2023-01-01' -- id: 'An 
Optimized Solution for Highly Contended Transactional Workloads' - manual: true - title: 'An Optimized Solution for Highly Contended Transactional Workloads' - link: https://link.springer.com/chapter/10.1007/978-981-99-8664-4_23 - authors: - - Chunxi Zhang - - Shuyan Zhang - - Ting Chen - - Rong Zhang - - Kai Liu - publisher: International Symposium on Dependable Software Engineering:Theories, Tools, and Applications (SETTA) - date: '2023-01-01' -- id: 'Leopard: A Black-Box Approach for Efficiently Verifying Various Isolation Levels' - manual: true - title: 'Leopard: A Black-Box Approach for Efficiently Verifying Various Isolation Levels' - link: https://ieeexplore.ieee.org/document/10184872 - authors: - - Keqiang Li - - Siyang Weng - - Peiyuan Liu - - Lyu Ni - - Chengcheng Yang - - Rong Zhang - - Xuan Zhou - - Jianghang Lou - - Gui Huang - - Weining Qian - - Aoying Zhou - publisher: IEEE International Conference on Data Engineering (ICDE) - date: '2023-01-01' -- id: 'A Scalable Query-Aware Enormous Database Generator for Database Evaluation' - title: A Scalable Query-Aware Enormous Database Generator for Database Evaluation - link: https://ieeexplore.ieee.org/document/9720100 - authors: - - Qingshuai Wang - - Yuming Li - - Rong Zhang - - Ke Shu - - Zhenjie Zhang - - Aoying Zhou - publisher: IEEE Transactions on Knowledge and Data Engineering (TKDE) - date: '2022-01-01' - link: https://doi.org/gppmbf - image: /illustration/paper.touchstone.2.png - extra-links: +# DO NOT EDIT, GENERATED AUTOMATICALLY + +- id: doi:10.1093/nar/gkad1082 + title: "The Monarch Initiative in 2024: an analytic platform integrating phenotypes,\ + \ genes\_and diseases across species" + authors: + - Tim E Putman + - Kevin Schaper + - Nicolas Matentzoglu + - "Vincent\_P Rubinetti" + - "Faisal\_S Alquaddoomi" + - Corey Cox + - J Harry Caufield + - Glass Elsarboukh + - Sarah Gehrke + - Harshad Hegde + - "Justin\_T Reese" + - Ian Braun + - "Richard\_M Bruskiewich" + - Luca Cappelletti + - Seth 
Carbon + - "Anita\_R Caron" + - "Lauren\_E Chan" + - "Christopher\_G Chute" + - "Katherina\_G Cortes" + - "Vin\xEDcius De\_Souza" + - Tommaso Fontana + - "Nomi\_L Harris" + - "Emily\_L Hartley" + - Eric Hurwitz + - "Julius\_O B Jacobsen" + - Madan Krishnamurthy + - "Bryan\_J Laraway" + - "James\_A McLaughlin" + - "Julie\_A McMurry" + - "Sierra\_A T Moxon" + - "Kathleen\_R Mullen" + - "Shawn\_T O\u2019Neil" + - "Kent\_A Shefchek" + - Ray Stefancsik + - Sabrina Toro + - "Nicole\_A Vasilevsky" + - "Ramona\_L Walls" + - "Patricia\_L Whetzel" + - David Osumi-Sutherland + - Damian Smedley + - "Peter\_N Robinson" + - "Christopher\_J Mungall" + - "Melissa\_A Haendel" + - "Monica\_C Munoz-Torres" + publisher: Nucleic Acids Research + date: '2023-11-24' + link: https://doi.org/gs6kmr + orcid: 0000-0002-4655-3773 + plugin: orcid.py + file: orcid.yaml +- id: doi:10.1101/2023.10.11.560955 + title: Integration of 168,000 samples reveals global patterns of the human gut microbiome + authors: + - Richard J. Abdill + - Samantha P. Graham + - Vincent Rubinetti + - Frank W. Albert + - Casey S. Greene + - Sean Davis + - Ran Blekhman + publisher: Cold Spring Harbor Laboratory + date: '2023-10-11' + link: https://doi.org/gsvf5z + orcid: 0000-0002-4655-3773 + plugin: orcid.py + file: orcid.yaml +- id: doi:10.1093/nar/gkad289 + title: 'MyGeneset.info: an interactive and programmatic platform for community-curated + and user-created collections of genes' + authors: + - Ricardo Avila + - Vincent Rubinetti + - Xinghua Zhou + - Dongbo Hu + - Zhongchao Qian + - Marco Alvarado Cano + - Everaldo Rodolpho + - Ginger Tsueng + - Casey Greene + - Chunlei Wu + publisher: Nucleic Acids Research + date: '2023-04-18' + link: https://doi.org/gr5hb5 + orcid: 0000-0002-4655-3773 + plugin: orcid.py + file: orcid.yaml +- id: doi:10.1101/2023.01.05.522941 + title: Hetnet connectivity search provides rapid insights into how two biomedical + entities are related + authors: + - Daniel S. 
Himmelstein + - Michael Zietz + - Vincent Rubinetti + - Kyle Kloster + - Benjamin J. Heil + - Faisal Alquaddoomi + - Dongbo Hu + - David N. Nicholson + - Yun Hao + - Blair D. Sullivan + - Michael W. Nagle + - Casey S. Greene + publisher: Cold Spring Harbor Laboratory + date: '2023-01-07' + link: https://doi.org/grmcb9 + orcid: 0000-0002-4655-3773 + plugin: orcid.py + file: orcid.yaml +- id: doi:10.1093/gigascience/giad047 + title: Hetnet connectivity search provides rapid insights into how biomedical entities + are related + authors: + - Daniel S Himmelstein + - Michael Zietz + - Vincent Rubinetti + - Kyle Kloster + - Benjamin J Heil + - Faisal Alquaddoomi + - Dongbo Hu + - David N Nicholson + - Yun Hao + - Blair D Sullivan + - Michael W Nagle + - Casey S Greene + publisher: GigaScience + date: '2022-12-28' + link: https://doi.org/gsd85n + orcid: 0000-0002-4655-3773 + plugin: orcid.py + file: orcid.yaml +- id: doi:10.1101/2022.02.18.461833 + title: 'MolEvolvR: A web-app for characterizing proteins using molecular evolution + and phylogeny' + authors: + - Jacob D Krol + - Joseph T Burke + - Samuel Z Chen + - Lo M Sosinski + - Faisal S Alquaddoomi + - Evan P Brenner + - Ethan P Wolfe + - Vincent P Rubinetti + - Shaddai Amolitos + - Kellen M Reason + - John B Johnston + - Janani Ravi + publisher: Cold Spring Harbor Laboratory + date: '2022-02-22' + link: https://doi.org/gstx7j + orcid: 0000-0002-4655-3773 + plugin: orcid.py + file: orcid.yaml +- id: doi:10.1186/s13059-020-02021-3 + title: Compressing gene expression data using multiple latent space dimensionalities + learns complementary biological representations + authors: + - Gregory P. Way + - Michael Zietz + - Vincent Rubinetti + - Daniel S. Himmelstein + - Casey S. 
Greene + publisher: Genome Biology + date: '2020-05-11' + link: https://doi.org/gg2mjh + orcid: 0000-0002-4655-3773 + plugin: orcid.py + file: orcid.yaml +- id: doi:10.1371/journal.pcbi.1007128 + title: Open collaborative writing with Manubot + authors: + - Daniel S. Himmelstein + - Vincent Rubinetti + - David R. Slochower + - Dongbo Hu + - Venkat S. Malladi + - Casey S. Greene + - Anthony Gitter + publisher: PLOS Computational Biology + date: '2020-12-04' + link: https://doi.org/c7np + orcid: 0000-0002-4655-3773 + plugin: sources.py + file: sources.yaml + type: paper + description: Lorem ipsum _dolor_ **sit amet**, consectetur adipiscing elit, sed + do eiusmod tempor incididunt ut labore et dolore magna aliqua. + image: https://journals.plos.org/ploscompbiol/article/figure/image?size=inline&id=info:doi/10.1371/journal.pcbi.1007128.g001&rev=2 + buttons: + - type: manubot + link: https://greenelab.github.io/meta-review/ - type: source - link: https://github.com/DBHammer/Touchstone + text: Manuscript Source + link: https://github.com/greenelab/meta-review + - type: website + link: http://manubot.org/ tags: - - Query-aware Data Generator - - OLAP Database Testing - - Query Generator -- id: 'Touchstone: Generating Enormous Query-Aware Test Databases' - title: 'Touchstone: Generating Enormous Query-Aware Test Databases' - link: https://www.usenix.org/conference/atc18/presentation/li-yuming - authors: - - Yuming Li - - Rong Zhang - - Xiaoyan Yang - - Zhenjie Zhang - - Aoying Zhou - publisher: USENIX Annual Technical Conference (USENIX ATC) - date: '2018-01-01' - image: /illustration/paper.touchstone.1.png - repo: DBHammer/Touchstone - extra-links: - - type: source - link: https://github.com/DBHammer/Touchstone -- id: doi:10.1016/j.tbench.2022.100031 - title: Are current benchmarks adequate to evaluate distributed transactional databases? 
- link: https://www.sciencedirect.com/science/article/pii/S2772485922000187 - authors: - - Luyi Qu - - Qingshuai Wang - - Ting Chen - - Keqiang Li - - Rong Zhang - - Xuan Zhou - - Quanqing Xu - - Zhifeng Yang - - Chuanhui Yang - - Weining Qian - - Aoying Zhou - publisher: BenchCouncil Transactions on Benchmarks, Standards and Evaluations - date: '2022-03-01' - link: https://doi.org/gqb25r - image: /illustration/AreCurrentBenchmark.jpg - extra-links: null -- id: doi:10.1007/s11704-020-0248-x - title: A comprehensive study on fault tolerance in stream processing systems - link: https://link.springer.com/article/10.1007/s11704-020-0248-x - authors: - - Xiaotong Wang - - Chunxi Zhang - - Junhua Fang - - Rong Zhang - - Weining Qian - - Aoying Zhou - publisher: Frontiers of Computer Science - date: '2021-09-25' - link: https://doi.org/gqpncg -- id: doi:10.1007/s11704-022-1056-2 - title: Scalable and quantitative contention generation for performance evaluation - on OLTP databases - authors: - - Chunxi Zhang - - Yuming Li - - Rong Zhang - - Weining Qian - - Aoying Zhou - publisher: Frontiers of Computer Science - date: '2022-08-09' - link: https://doi.org/gqpnch -- id: doi:10.1109/ICDE53745.2022.00036 - title: Application-Oriented Workload Generation for Transactional Database Performance Evaluation - link: https://ieeexplore.ieee.org/document/9835481 - authors: - - Luyi Qu - - Yuming Li - - Rong Zhang - - Ting Chen - - Ke Shu - - Weining Qian - - Aoying Zhou - publisher: IEEE 38th International Conference on Data Engineering (ICDE) - date: '2022-05-01' - link: https://doi.org/gqpnck -- id: doi:10.1109/TKDE.2019.2947055 - title: 'A-DSP: An Adaptive Join Algorithm for Dynamic Data Stream on Cloud System' - link: https://ieeexplore.ieee.org/document/8868214 - authors: - - Junhua Fang - - Rong Zhang - - Yan Zhao - - Kai Zheng - - Xiaofang Zhou - - Aoying Zhou - publisher: IEEE Transactions on Knowledge and Data Engineering (TKDE) + - open science + - collaboration + repo: 
greenelab/meta-review +- id: doi:10.1101/573782 + title: Sequential compression of gene expression across dimensionalities and methods + reveals no single best method or dimensionality + authors: + - Gregory P. Way + - Michael Zietz + - Vincent Rubinetti + - Daniel S. Himmelstein + - Casey S. Greene + publisher: Cold Spring Harbor Laboratory + date: '2019-03-11' + link: https://doi.org/gfxjxf + orcid: 0000-0002-4655-3773 + plugin: orcid.py + file: orcid.yaml +- id: doi:10.1016/j.csbj.2020.05.017 + title: Constructing knowledge graphs and their biomedical applications + authors: + - David N. Nicholson + - Casey S. Greene + publisher: Computational and Structural Biotechnology Journal date: '2020-01-01' - link: https://doi.org/gqpncm -- id: doi:10.1007/978-3-030-85896-4_15 - title: Dynamic Environment Simulation for Database Performance Evaluation - link: https://link.springer.com/chapter/10.1007/978-3-030-85896-4_15 - authors: - - Chunxi Zhang - - Rong Zhang - - Qian Su - - Aoying Zhou - publisher: Web and Big Data - date: '2021-01-01' - link: https://doi.org/gqpncn -- id: doi:10.1142/11709 - title: Load Balance for Distributed Real-time Computing Systems - authors: - - Junhua Fang - - Rong Zhang - - Aoying Zhou - publisher: East China Normal University Scientific Reports - date: '2020-07-01' - link: https://doi.org/gqpncp -- id: doi:10.1007/s11704-019-8438-0 - title: Benchmarking on intensive transaction processing - link: https://link.springer.com/article/10.1007/s11704-019-8438-0 - authors: - - Chunxi Zhang - - Yuming Li - - Rong Zhang - - Weining Qian - - Aoying Zhou - publisher: Frontiers of Computer Science - date: '2020-01-03' - link: https://doi.org/gqpncq -- id: doi:10.1007/978-3-030-60290-1_8 - title: Evaluating Fault Tolerance of Distributed Stream Processing Systems - link: https://link.springer.com/chapter/10.1007/978-3-030-60290-1_8 - authors: - - Xiaotong Wang - - Cheng Jiang - - Junhua Fang - - Ke Shu - - Rong Zhang - - Weining Qian - - Aoying Zhou - 
publisher: Web and Big Data - date: '2020-01-01' - link: https://doi.org/gqpncs -- id: doi:10.1007/978-3-030-60290-1_34 - title: Quantitative Contention Generation for Performance Evaluation on OLTP Databases - link: https://link.springer.com/chapter/10.1007/978-3-030-60290-1_34 - authors: - - Chunxi Zhang - - Rong Zhang - - Weining Qian - - Ke Shu - - Aoying Zhou - publisher: Web and Big Data - date: '2020-01-01' - link: https://doi.org/gqpnct -- id: doi:10.1007/978-3-030-71058-3_5 - title: 'Artemis: An Automatic Test Suite Generator for Large Scale OLAP Database' - link: https://link.springer.com/chapter/10.1007/978-3-030-71058-3_5 - authors: - - Kaiming Mi - - Chunxi Zhang - - Weining Qian - - Rong Zhang - publisher: Benchmarking, Measuring, and Optimizing - date: '2021-01-01' - link: https://doi.org/gqpncv -- id: doi:10.1007/s11280-018-0656-0 - title: Integrating workload balancing and fault tolerance in distributed stream - processing system - authors: - - Junhua Fang - - Pingfu Chao - - Rong Zhang - - Xiaofang Zhou - publisher: World Wide Web - date: '2019-01-07' - link: https://doi.org/gqpncw -- id: doi:10.1007/978-3-030-26075-0_15 - title: 'Apara: Workload-Aware Data Partition and Replication for Parallel Databases' - authors: - - Xiaolei Zhang - - Chunxi Zhang - - Yuming Li - - Rong Zhang - - Aoying Zhou - publisher: Web and Big Data - date: '2019-01-01' - link: https://doi.org/gqpncx -- id: doi:10.1007/s11704-016-6194-y - title: Distribution-free data density estimation in large-scale networks - authors: - - Minqi Zhou - - Rong Zhang - - Weining Qian - - Aoying Zhou - publisher: Frontiers of Computer Science - date: '2018-12-01' - link: https://doi.org/gqpncz -- id: doi:10.1109/TPDS.2018.2827380 - title: Distributed Stream Rebalance for Stateful Operator Under Workload Variance - authors: - - Junhua Fang - - Rong Zhang - - Tom Z. J. 
Fu - - Zhenjie Zhang - - Aoying Zhou - - Xiaofang Zhou - publisher: IEEE Transactions on Parallel and Distributed Systems - date: '2018-10-01' - link: https://doi.org/gfbfnj -- id: doi:10.1007/978-3-030-32813-9_13 - title: Benchmarking for Transaction Processing Database Systems in Big Data Era - authors: - - Chunxi Zhang - - Yuming Li - - Rong Zhang - - Weining Qian - - Aoying Zhou - publisher: Benchmarking, Measuring, and Optimizing - date: '2019-01-01' - link: https://doi.org/gnf67r -- id: doi:10.1007/978-3-319-91458-9_52 - title: 'AdaptMX: Flexible Join-Matrix Streaming System for Distributed Theta-Joins' - authors: - - Xiaotong Wang - - Cheng Jiang - - Junhua Fang - - Xiangfeng Wang - - Rong Zhang - publisher: Database Systems for Advanced Applications - date: '2018-01-01' - link: https://doi.org/gqpnc3 -- id: doi:10.1007/s11280-017-0431-7 - title: Distributed stream join under workload variance - authors: - - Junhua Fang - - Rong Zhang - - Xiaotong Wang - - Aoying Zhou - publisher: World Wide Web - date: '2017-01-23' - link: https://doi.org/gqpnc4 -- id: doi:10.1007/978-3-319-55699-4_39 - title: Cost-Effective Data Partition for Distributed Stream Processing System - authors: - - Xiaotong Wang - - Junhua Fang - - Yuming Li - - Rong Zhang - - Aoying Zhou - publisher: Database Systems for Advanced Applications - date: '2017-01-01' - link: https://doi.org/gqpndj -- id: doi:10.1145/3078597.3078613 - title: Parallel Stream Processing Against Workload Skewness and Variance - authors: - - Junhua Fang - - Rong Zhang - - Tom Z.J. 
Fu - - Zhenjie Zhang - - Aoying Zhou - - Junhua Zhu - publisher: Proceedings of the 26th International Symposium on High-Performance Parallel - and Distributed Computing - date: '2017-06-26' - link: https://doi.org/gqpnm2 -- id: doi:10.1007/s10115-015-0880-1 - title: Learning user credibility for product ranking - authors: - - Rong Zhang - - Ming Gao - - Xiaofeng He - - Aoying Zhou - publisher: Knowledge and Information Systems - date: '2015-09-30' - link: https://doi.org/f79gqn -- id: doi:10.1007/978-3-319-45817-5_1 - title: Flexible and Adaptive Stream Join Algorithm - authors: - - Junhua Fang - - Xiaotong Wang - - Rong Zhang - - Aoying Zhou - publisher: Web Technologies and Applications - date: '2016-01-01' - link: https://doi.org/gqpnm4 -- id: doi:10.1007/978-3-319-45814-4_2 - title: 'NERank: Ranking Named Entities in Document Collections' - authors: - - Chengyu Wang - - Rong Zhang - - Xiaofeng He - - Guomin Zhou - - "Aoying Zhou" - publisher: Web Technologies and Applications - date: '2016-01-01' - link: https://doi.org/gqpnm5 -- id: doi:10.1145/2983323.2983705 - title: Error Link Detection and Correction in Wikipedia - authors: - - Chengyu Wang - - Rong Zhang - - Xiaofeng He - - Aoying Zhou - publisher: Proceedings of the 25th ACM International on Conference on Information - and Knowledge Management - date: '2016-10-24' - link: https://doi.org/gqpnm6 -- id: doi:10.1145/2983323.2983773 - title: Cost-Effective Stream Join Algorithm on Cloud System - authors: - - Junhua Fang - - Rong Zhang - - Xiaotong Wang - - Tom Z.J. 
Fu - - Zhenjie Zhang - - Aoying Zhou - publisher: Proceedings of the 25th ACM International on Conference on Information - and Knowledge Management - date: '2016-10-24' - link: https://doi.org/gqpnnb -- id: doi:10.1007/978-3-319-39958-4_7 - title: Learning User Credibility on Aspects from Review Texts - authors: - - Yifan Gao - - Yuming Li - - Yanhong Pan - - Jiali Mao - - Rong Zhang - publisher: Web-Age Information Management - date: '2016-01-01' - link: https://doi.org/gqpnnd -- id: doi:10.1007/978-3-319-48740-3_35 - title: Event Phase Extraction and Summarization - authors: - - Chengyu Wang - - Rong Zhang - - Xiaofeng He - - Guomin Zhou - - Aoying Zhou - publisher: "Web Information Systems Engineering \u2013 WISE 2016" - date: '2016-01-01' - link: https://doi.org/gqpnng -- id: doi:10.1145/2872518.2889348 - title: 'NERank: Ranking Named Entities in Document Collections' - authors: - - Chengyu Wang - - Rong Zhang - - Xiaofeng He - - Aoying Zhou - publisher: Proceedings of the 25th International Conference Companion on World Wide - Web - WWW '16 Companion - date: '2016-01-01' - link: https://doi.org/gqpnnh -- id: doi:10.1007/s11704-014-3492-0 - title: Product-oriented review summarization and scoring - authors: - - Rong Zhang - - Wenzhe Yu - - Chaofeng Sha - - Xiaofeng He - - Aoying Zhou - publisher: Frontiers of Computer Science - date: '2015-01-21' - link: https://doi.org/gqpnnk -- id: doi:10.1007/s11280-014-0296-y - title: Detecting anomaly in data streams by fractal model - authors: - - Rong Zhang - - Minqi Zhou - - Xueqing Gong - - Xiaofeng He - - Weining Qian - - Shouke Qin - - Aoying Zhou - publisher: World Wide Web - date: '2014-06-10' - link: https://doi.org/gqpnnm -- id: doi:10.1109/WISA.2015.63 - title: 'ACID Encountering the CAP Theorem: Two Bank Case Studies' - authors: - - Chao Kong - - Ming Gao - - Weining Qian - - Minqi Zhou - - Xueqing Gong - - Rong Zhang - - Aoying Zhou - publisher: 2015 12th Web Information System and Application Conference 
(WISA) - date: '2015-09-01' - link: https://doi.org/gqpnnp -- id: doi:10.1007/978-3-319-19548-3_29 - title: 'SEMI: A Scalable Entity Matching System Based on MapReduce' - authors: - - Pingfu Chao - - Yuming Li - - Zhu Gao - - Junhua Fang - - Xiaofeng He - - Rong Zhang - publisher: Lecture Notes in Computer Science - date: '2015-01-01' - link: https://doi.org/gqpnnq -- id: doi:10.1007/978-3-319-28121-6_15 - title: Multi-dimensional User Credibility Analysis on Review Content - authors: - - Yifan Gao - - Yuming Li - - Rong Zhang - publisher: Web Technologies and Applications - date: '2015-01-01' - link: https://doi.org/gqpnnr -- id: doi:10.1007/978-3-319-25255-1_42 - title: Random-Based Algorithm for Efficient Entity Matching - authors: - - Pingfu Chao - - Zhu Gao - - Yuming Li - - Junhua Fang - - Rong Zhang - - Aoying Zhou - publisher: Web Technologies and Applications - date: '2015-01-01' - link: https://doi.org/gqpnns -- id: doi:10.1007/978-3-319-25255-1_51 - title: User Generated Content Oriented Chinese Taxonomy Construction - authors: - - Jinyang Li - - Chengyu Wang - - Xiaofeng He - - Rong Zhang - - Ming Gao - publisher: Web Technologies and Applications - date: '2015-01-01' - link: https://doi.org/gqpnnt -- id: doi:10.1007/978-3-319-18123-3_33 - title: A Restaurant Recommendation System by Analyzing Ratings and Aspects in Reviews - authors: - - Yifan Gao - - Wenzhe Yu - - Pingfu Chao - - Rong Zhang - - Aoying Zhou - - Xiaoyan Yang - publisher: Database Systems for Advanced Applications - date: '2015-01-01' - link: https://doi.org/gqpnnv -- id: doi:10.1109/ICDEW.2015.7129545 - title: Challenges in Chinese knowledge graph construction - authors: - - Chengyu Wang - - Ming Gao - - Xiaofeng He - - Rong Zhang - publisher: 2015 31st IEEE International Conference on Data Engineering Workshops - date: '2015-04-01' - link: https://doi.org/gqpnnw -- id: doi:10.1109/ICDE.2015.7113308 - title: Dish comment summarization based on bilateral topic analysis - authors: - - 
Rong Zhang - - Zhenjie Zhang - - Xiaofeng He - - Aoying Zhou - publisher: 2015 IEEE 31st International Conference on Data Engineering - date: '2015-04-01' - link: https://doi.org/gqpnnx -- id: doi:10.1007/978-3-319-21042-1_20 - title: Review Comment Analysis for Predicting Ratings - authors: - - Rong Zhang - - Yifan Gao - - Wenzhe Yu - - Pingfu Chao - - Xiaoyan Yang - - Ming Gao - - Aoying Zhou - publisher: Web-Age Information Management - date: '2015-01-01' - link: https://doi.org/gqpnnz -- id: doi:10.1007/978-3-319-21042-1_30 - title: Computing Probability Threshold Set Similarity on Probabilistic Sets - authors: - - Lei Wang - - Ming Gao - - Rong Zhang - - Cheqing Jin - - Aoying Zhou - publisher: Web-Age Information Management - date: '2015-01-01' - link: https://doi.org/gqpnpc -- id: doi:10.1007/978-3-319-21042-1_48 - title: Efficient MapReduce-Based Method for Massive Entity Matching - authors: - - Pingfu Chao - - Zhu Gao - - Yuming Li - - Junhua Fang - - Rong Zhang - - Aoying Zhou - publisher: Web-Age Information Management - date: '2015-01-01' - link: https://doi.org/gqpnpf -- id: doi:10.1002/dac.2619 - title: 'MR-tree: an efficient index for MapReduce' - authors: - - Chunsheng Li - - Jie Chen - - Cheqing Jin - - Rong Zhang - - Aoying Zhou - publisher: International Journal of Communication Systems - date: '2013-08-08' - link: https://doi.org/gqpnpn -- id: doi:10.1109/ASONAM.2014.6921558 - title: Online evaluation re-scoring based on review behavior analysis - authors: - - Rong Zhang - - Xiaofeng He - - Aoying Zhou - - Chaofeng Sha - publisher: 2014 IEEE/ACM International Conference on Advances in Social Networks - Analysis and Mining (ASONAM 2014) - date: '2014-08-01' - link: https://doi.org/gqpnpq -- id: doi:10.1007/978-3-319-05810-8_27 - title: Probabilistic Reverse Top-k Queries - authors: - - Cheqing Jin - - Rong Zhang - - Qiangqiang Kang - - Zhao Zhang - - Aoying Zhou - publisher: Database Systems for Advanced Applications - date: '2014-01-01' - link: 
https://doi.org/gqpnpr -- id: doi:10.1007/978-3-319-05813-9_36 - title: 'TaxiHailer: A Situation-Specific Taxi Pick-Up Points Recommendation System' - authors: - - Leyi Song - - Chengyu Wang - - Xiaoyi Duan - - Bing Xiao - - Xiao Liu - - Rong Zhang - - Xiaofeng He - - Xueqing Gong - publisher: Database Systems for Advanced Applications - date: '2014-01-01' - link: https://doi.org/gqpnpv -- id: doi:10.1007/s11704-013-1256-x - title: Context-sensitive Web service discovery over the bipartite graph model - authors: - - Rong Zhang - - Koji Zettsu - - Yutaka Kidawara - - Yasushi Kiyoki - - Aoying Zhou - publisher: Frontiers of Computer Science - date: '2013-09-25' - link: https://doi.org/gqpnpw -- id: doi:10.1007/978-3-642-37401-2_70 - title: Selecting a Diversified Set of Reviews - authors: - - Wenzhe Yu - - Rong Zhang - - Xiaofeng He - - Chaofeng Sha - publisher: Web Technologies and Applications - date: '2013-01-01' - link: https://doi.org/gqpnqh -- id: doi:10.1007/978-3-642-37450-0_28 - title: A Hybrid Framework for Product Normalization in Online Shopping - authors: - - Li Wang - - Rong Zhang - - Chaofeng Sha - - Xiaofeng He - - Aoying Zhou - publisher: Database Systems for Advanced Applications - date: '2013-01-01' - link: https://doi.org/gqpnqk -- id: doi:10.1109/ICDM.2013.62 - title: Search Behavior Based Latent Semantic User Segmentation for Advertising Targeting - authors: - - Xueqing Gong - - Xinyu Guo - - Rong Zhang - - Xiaofeng He - - Aoying Zhou - publisher: 2013 IEEE 13th International Conference on Data Mining - date: '2013-12-01' - link: https://doi.org/gqpnqm -- id: doi:10.1007/978-3-642-39527-7_37 - title: Threshold Selection for Classification with Skewed Class Distribution - authors: - - Xiaofeng He - - Rong Zhang - - Aoying Zhou - publisher: Web-Age Information Management - date: '2013-01-01' - link: https://doi.org/gqpnqn -- id: doi:10.1007/978-3-642-41230-1_46 - title: "Predicting Users\u2019 Age Range in Micro-blog Network" - authors: - - 
Chengyu Wang - - Bing Xiao - - Xiang Li - - Jiawen Zhu - - Xiaofeng He - - Rong Zhang - publisher: Lecture Notes in Computer Science - date: '2013-01-01' - link: https://doi.org/gqpnqp -- id: doi:10.1109/CGC.2012.11 - title: Web Service Ranking Based on Context - authors: - - Rong Zhang - - Koji Zettsu - - Yutaka Kidawara - - Yasushi Kiyoki - publisher: 2012 Second International Conference on Cloud and Green Computing - date: '2012-11-01' - link: https://doi.org/gqpnqq -- id: doi:10.1145/2396761.2398591 - title: Credibility-based product ranking for C2C transactions - authors: - - Rong Zhang - - Chao Feng Sha - - Min Qi Zhou - - Ao Ying Zhou - publisher: Proceedings of the 21st ACM international conference on Information and - knowledge management - CIKM '12 - date: '2012-01-01' - link: https://doi.org/gqpnqr -- id: doi:10.1145/2187980.2188171 - title: Exploiting shopping and reviewing behavior to re-score online evaluations - authors: - - Rong Zhang - - ChaoFeng Sha - - Minqi Zhou - - Aoying Zhou - publisher: Proceedings of the 21st international conference companion on World Wide - Web - WWW '12 Companion - date: '2012-01-01' - link: https://doi.org/gqpnqt -- id: doi:10.1007/978-3-642-20149-3_31 - title: Context-Sensitive Query Expansion over the Bipartite Graph Model for Web - Service Search - authors: - - Rong Zhang - - Koji Zettsu - - Yutaka Kidawara - - Yasushi Kiyoki - publisher: Database Systems for Advanced Applications - date: '2011-01-01' - link: https://doi.org/frhnnr -- id: doi:10.1109/IUCS.2010.5666772 - title: 'Services in the Cloud Computing era: A survey' - authors: - - Minqi Zhou - - Rong Zhang - - Dadan Zeng - - Weining Qian - publisher: 2010 4th International Universal Communication Symposium - date: '2010-10-01' - link: https://doi.org/c8b9hw -- id: doi:10.1109/SKG.2010.18 - title: Join Optimization in the MapReduce Environment for Column-wise Data Store - authors: - - Minqi Zhou - - Rong Zhang - - Dadan Zeng - - Weining Qian - - Aoying Zhou - 
publisher: 2010 Sixth International Conference on Semantics, Knowledge and Grids - date: '2010-11-01' - link: https://doi.org/bfbt2f -- id: doi:10.1109/SKG.2010.19 - title: 'Security and Privacy in Cloud Computing: A Survey' - authors: - - Minqi Zhou - - Rong Zhang - - Wei Xie - - Weining Qian - - Aoying Zhou - publisher: 2010 Sixth International Conference on Semantics, Knowledge and Grids - date: '2010-11-01' - link: https://doi.org/fgjt5x -- id: doi:10.1007/978-3-642-14246-8_36 - title: Exploiting Service Context for Web Service Search Engine - authors: - - Rong Zhang - - Koji Zettsu - - Yutaka Kidawara - - Yasushi Kiyoki - publisher: Web-Age Information Management - date: '2010-01-01' - link: https://doi.org/dqv5s7 -- id: doi:10.1016/j.future.2008.02.010 - title: An efficient peer-to-peer indexing tree structure for multidimensional data - authors: - - Rong Zhang - - Weining Qian - - Aoying Zhou - - Minqi Zhou - publisher: Future Generation Computer Systems - date: '2009-01-01' - link: https://doi.org/dfs3xw -- id: doi:10.1145/1667780.1667834 - title: 'SOBEX: distributed service search engine that exploits service collaboration - context' - authors: - - Rong Zhang - - Koji Zettsu - - Takafumi Nakanishi - - Yutaka Kidawara - - Yasushi Kiyoki - publisher: Proceedings of the 3rd International Universal Communication Symposium - on - IUCS '09 - date: '2009-01-01' - link: https://doi.org/dvndb6 -- id: doi:10.1109/SKG.2009.89 - title: Context-Based Web Service Clustering - authors: - - Rong Zhang - - Koji Zettsu - - Takafumi Nakanishi - - Yutaka Kidawara - - Yasushi Kiyoki - publisher: 2009 Fifth International Conference on Semantics, Knowledge and Grid - date: '2009-01-01' - link: https://doi.org/dbvvkf -- id: doi:10.1016/j.datak.2008.06.013 - title: Adaptive indexing for content-based search in P2P systems - authors: - - Aoying Zhou - - Rong Zhang - - Weining Qian - - Quang Hieu Vu - - Tianming Hu - publisher: Data & Knowledge Engineering - date: '2008-12-01' - 
link: https://doi.org/ctdjnc -- id: doi:10.1007/s11704-008-0025-8 - title: Decentralized architecture for resource management of group-based distributed - systems - authors: - - Rong Zhang - - Koji Zettsu - - Yutaka Kidawara - - Yasushi Kiyoki - publisher: Frontiers of Computer Science in China - date: '2008-08-12' - link: https://doi.org/dq85w5 -- id: doi:10.1109/ICDE.2008.4497617 - title: 'COSTA: Adaptive Indexing for Terms in a Large-scale Distributed System' - authors: - - Aoying Zhou - - Rong Zhang - - Quang Hieu Vu - - Weining Qian - publisher: 2008 IEEE 24th International Conference on Data Engineering - date: '2008-04-01' - link: https://doi.org/b3fqd6 -- id: doi:10.1007/978-3-540-71703-4_7 - title: 'GChord: Indexing for Multi-Attribute Query in P2P System with Low Maintenance - Cost' - authors: - - Minqi Zhou - - Rong Zhang - - Weining Qian - - Aoying Zhou - publisher: 'Advances in Databases: Concepts, Systems and Applications' - date: '2007-01-01' - link: https://doi.org/brz9pg -- id: doi:10.4108/infoscale.2007.908 - title: 'SDI: A Swift Tree Structure for Multi-dimensional Data Indexing in Peer-to-Peer - Networks' - authors: - - Rong Zhang - - Weining Qian - - Minqi Zhou - - Aoying Zhou - publisher: Proceedings of the 2nd International ICST Conference on Scalable Information - Systems - date: '2007-01-01' - link: https://doi.org/gqpnrg -- id: doi:10.1109/ICDE.2006.169 - title: 'VBI-Tree: A Peer-to-Peer Framework for Supporting Multi-Dimensional Indexing - Schemes' - authors: - - H.V. Jagadish - - ' Beng Chin Ooi' - - ' Quang Hieu Vu' - - ' Rong Zhang' - - ' Aoying Zhou' - publisher: 22nd International Conference on Data Engineering (ICDE'06) - date: '2006-01-01' - link: https://doi.org/cxtt65 -- id: doi:10.1145/1142473.1142475 - title: Speeding up search in peer-to-peer networks with a multi-way tree structure - authors: - - H. V. 
Jagadish - - Beng Chin Ooi - - Kian-Lee Tan - - Quang Hieu Vu - - Rong Zhang - publisher: Proceedings of the 2006 ACM SIGMOD international conference on Management - of data - SIGMOD '06 - date: '2006-01-01' - link: https://doi.org/dg6354 - -- id: "\u9762\u5411\u5206\u5e03\u5f0f\u4e8b\u52a1\u578b\u6570\u636e\u5e93\u7cfb\u7edf\ - \u7684\u8bc4\u6d4b\u57fa\u51c6\u8bbe\u8ba1\u4e0e\u5b9e\u73b0\u0020" - manual: true - title: "\u9762\u5411\u5206\u5e03\u5f0f\u4e8b\u52a1\u578b\u6570\u636e\u5e93\u7cfb\u7edf\ - \u7684\u8bc4\u6d4b\u57fa\u51c6\u8bbe\u8ba1\u4e0e\u5b9e\u73b0\u0020" - publisher: "\u0043\u0043\u0046\u4e2d\u56fd\u6570\u636e\u5e93\u5b66\u672f\u4f1a\u8bae (NDBC)" - authors: - - "\u4f55\u6d77\u6797\u0020" - - "\u5f20\u60e0\u4e1c" - - "\u7FC1\u601D\u626C" - - "\u5F20\u84C9" - date: '2024-07-01' - -- id: "HTAP\u8bc4\u6d4b\u57fa\u51c6\u7684\u8bc4\u6d4b\u80fd\u529b\u7efc\u8ff0" - manual: true - title: "HTAP\u8bc4\u6d4b\u57fa\u51c6\u7684\u8bc4\u6d4b\u80fd\u529b\u7efc\u8ff0" - publisher: "\u8F6F\u4EF6\u5B66\u62A5" - link: https://jos.org.cn/jos/article/pdf/7225 - authors: - - "\u7FC1\u601D\u626C" - - "\u4fde\u878d" - - "\u738B\u6E05\u5E05" - - "\u80E1\u6893\u9510" - - "\u502a\u844e" - - "\u5F20\u84C9" - - "\u5468\u70DC" - - "\u5468\u50B2\u82F1" - - "\u5F90\u6CC9\u6E05" - - "\u6768\u4F20\u8F89" - - "\u5218\u7EF4" - - "\u6768\u6500\u98DE" - date: '2024-05-20' -- id: "HTAP\u6570\u636E\u5E93\u7CFB\u7EDF\u6570\u636E\u5171\u4EAB\u6A21\u578B\u4E0E\ - \u4F18\u5316\u7B56\u7565" - manual: true - title: "HTAP\u6570\u636E\u5E93\u7CFB\u7EDF\u6570\u636E\u5171\u4EAB\u6A21\u578B\u4E0E\ - \u4F18\u5316\u7B56\u7565" - publisher: "\u8F6F\u4EF6\u5B66\u62A5" - link: https://jos.org.cn/jos/article/pdf/6901 - authors: - - "\u80E1\u6893\u9510" - - "\u7FC1\u601D\u626C" - - "\u4FDE\u878D" - - "\u5F90\u91D1\u51EF" - - "\u738B\u6E05\u5E05" - - "\u5F20\u84C9" - - "\u5468\u70DC" - date: '2023-07-12' -- manual: true - id: "\u9762\u5411\u590D\u6742\u67E5\u8BE2\u7684\u53EF\u6269\u5C55\u5E94\u7528\u573A\ - 
\u666F\u751F\u6210" - title: "\u9762\u5411\u590D\u6742\u67E5\u8BE2\u7684\u53EF\u6269\u5C55\u5E94\u7528\ - \u573A\u666F\u751F\u6210" - publisher: "\u0043\u0043\u0046\u4e2d\u56fd\u6570\u636e\u5e93\u5b66\u672f\u4f1a\u8bae (NDBC)" - authors: - - "\u674E\u597D" - - "\u738B\u6E05\u5E05" - - "\u5F20\u84C9" - - "\u94B1\u536B\u5B81" - date: '2022-08-20' -- id: "\u5206\u5E03\u5F0F\u6570\u636E\u6D41\u4E0A\u7684\u9AD8\u6027\u80FD\u5206\u53D1\ - \u7B56\u7565" - manual: true - title: "\u5206\u5E03\u5F0F\u6570\u636E\u6D41\u4E0A\u7684\u9AD8\u6027\u80FD\u5206\ - \u53D1\u7B56\u7565" - publisher: "\u8F6F\u4EF6\u5B66\u62A5" - authors: - - "\u623F\u4FCA\u534E" - - "\u738B\u6653\u6850" - - "\u5F20\u84C9" - - "\u5468\u50B2\u82F1" - date: '2016-01-01' -- id: "\u8003\u8651\u89C2\u70B9\u591A\u6837\u6027\u7684\u8BC4\u8BBA\u9009\u62E9\u95EE\ - \u9898" - manual: true - title: "\u8003\u8651\u89C2\u70B9\u591A\u6837\u6027\u7684\u8BC4\u8BBA\u9009\u62E9\ - \u95EE\u9898" - publisher: "\u8BA1\u7B97\u673A\u7814\u7A76\u4E0E\u53D1\u5C55" - authors: - - "\u4F59\u6587\u5586" - - "\u6C99\u671D\u950B" - - "\u4F55\u6653\u4E30" - - "\u5F20\u84C9" - date: '2015-05-15' -- id: "\u7535\u5B50\u5546\u52A1\u5546\u54C1\u5F52\u4E00\u5316\u65B9\u6CD5\u7814\u7A76" - manual: true - title: "\u7535\u5B50\u5546\u52A1\u5546\u54C1\u5F52\u4E00\u5316\u65B9\u6CD5\u7814\ - \u7A76" - publisher: "\u8BA1\u7B97\u673A\u5B66\u62A5" - authors: - - "\u738B\u7ACB" - - "\u5F20\u84C9" - - "\u6C99\u671D\u950B" - - "\u738B\u6653\u73B2" - - "\u5468\u50B2\u82F1" - date: '2014-01-01' -- id: "\u7535\u5B50\u5546\u52A1\u7CFB\u7EDF\u4E2D\u7684\u5546\u54C1\u63A8\u8350\u7CFB\ - \u7EDF" - manual: true - title: "\u7535\u5B50\u5546\u52A1\u7CFB\u7EDF\u4E2D\u7684\u5546\u54C1\u63A8\u8350\ - \u7CFB\u7EDF" - publisher: "\u534E\u4E1C\u5E08\u8303\u5927\u5B66\u5B66\u62A5" - authors: - - "\u4F59\u6587\u5586" - - "\u5F20\u84C9" - - "\u738B\u7ACB" - date: '2013-01-01' -- id: "\u4E00\u79CD\u652F\u6301\u591A\u7EF4\u6570\u636E\u8303\u56F4\u67E5\u8BE2\u7684\ - 
\u5BF9\u7B49\u8BA1\u7B97\u7D22\u5F15\u6846\u67B6" - manual: true - title: "\u4E00\u79CD\u652F\u6301\u591A\u7EF4\u6570\u636E\u8303\u56F4\u67E5\u8BE2\ - \u7684\u5BF9\u7B49\u8BA1\u7B97\u7D22\u5F15\u6846\u67B6" - publisher: "\u8BA1\u7B97\u673A\u7814\u7A76\u4E0E\u53D1\u5C55" - authors: - - "\u5F20\u84C9" - - "\u94B1\u536B\u5B81" - - "\u5468\u50B2\u82F1" - date: '2009-01-01' -- id: "\u5927\u89C4\u6A21\u5206\u5E03\u5F0F\u7CFB\u7EDF\u4E2D\u7684\u591A\u5C5E\u6027\ - \u67E5\u8BE2\u5904\u7406" - manual: true - title: "\u5927\u89C4\u6A21\u5206\u5E03\u5F0F\u7CFB\u7EDF\u4E2D\u7684\u591A\u5C5E\ - \u6027\u67E5\u8BE2\u5904\u7406" - publisher: "\u8BA1\u7B97\u673A\u5B66\u62A5" - authors: - - "\u5468\u50B2\u82F1" - - "\u5468\u654F\u5947" - - "\u94B1\u536B\u5B81" - - "\u5F20\u84C9" - date: '2008-01-01' -- id: "\u4E00\u7AD9\u5F0F\u670D\u52A1\u63A8\u8350\u7CFB\u7EDF" - manual: true - title: "\u4E00\u7AD9\u5F0F\u670D\u52A1\u63A8\u8350\u7CFB\u7EDF" - publisher: \u0043\u0043\u0046\u4e2d\u56fd\u6570\u636e\u5e93\u5b66\u672f\u4f1a\u8bae (NDBC) - authors: - - "\u9AD8\u794E\u74A0" - - "\u90D1\u82B7\u51CC" - - "\u4F59\u6587\u5586" - - "\u7A0B\u6587\u4EAE" - - "\u5F20\u84C9" - date: '2014-01-01' \ No newline at end of file + link: https://doi.org/gg7m48 + image: https://ars.els-cdn.com/content/image/1-s2.0-S2001037020302804-gr1.jpg + plugin: sources.py + file: sources.yaml +- id: doi:10.7554/eLife.32822 + title: Sci-Hub provides access to nearly all scholarly literature + authors: + - Daniel S Himmelstein + - Ariel Rodriguez Romero + - Jacob G Levernier + - Thomas Anthony Munro + - Stephen Reid McLaughlin + - Bastian Greshake Tzovaras + - Casey S Greene + publisher: eLife + date: '2018-03-01' + link: https://doi.org/ckcj + image: https://iiif.elifesciences.org/lax:32822%2Felife-32822-fig8-v3.tif/full/863,/0/default.webp + plugin: sources.py + file: sources.yaml diff --git a/_includes/head.html b/_includes/head.html index 28219ef..c21a44a 100644 --- a/_includes/head.html +++ b/_includes/head.html 
@@ -1,7 +1,7 @@ {% include analytics.html %} + {% include verification.html %} {% include meta.html %} - {% include favicons.html %} {% include fonts.html %} {% include styles.html %} {% include scripts.html %} diff --git a/_includes/link.html b/_includes/link.html new file mode 100644 index 0000000..5b37065 --- /dev/null +++ b/_includes/link.html @@ -0,0 +1,36 @@ +{%- assign type = include.type | default: "link" -%} +{%- assign type = site.data.links[type] -%} +{%- assign link = include.link -%} + +{%- if type and link -%} + + {%- assign icon = include.icon -%} + {%- if icon == "" -%} + {%- assign icon = type.icon -%} + {%- endif -%} + + {%- assign text = include.text -%} + {%- if text == "" -%} + {%- assign text = type.text -%} + {%- endif -%} + + {%- assign tooltip = include.tooltip -%} + {%- if tooltip == "" -%} + {%- assign tooltip = type.tooltip -%} + {%- endif -%} + + {%- assign link = type.link | replace: "$LINK", link -%} + + {%- assign flip = include.flip | default: false -%} + + + {%- if icon contains "fa-" -%} + + {%- elsif icon -%} + {% include {{ icon }} %} + {%- endif -%} + {%- if text -%} + {{ text }} + {%- endif -%} + +{%- endif -%} diff --git "a/_posts/2022-05-28-OceanBase\344\270\216TiDB\344\274\230\345\214\226\345\231\250\347\232\204\345\237\272\346\225\260\351\242\204\344\274\260\345\207\206\347\241\256\345\272\246\345\222\214\350\277\236\346\216\245\351\241\272\345\272\217\351\200\211\346\213\251\350\203\275\345\212\233\347\232\204\350\257\204\346\265\213.md" "b/_posts/2022-05-28-OceanBase\344\270\216TiDB\344\274\230\345\214\226\345\231\250\347\232\204\345\237\272\346\225\260\351\242\204\344\274\260\345\207\206\347\241\256\345\272\246\345\222\214\350\277\236\346\216\245\351\241\272\345\272\217\351\200\211\346\213\251\350\203\275\345\212\233\347\232\204\350\257\204\346\265\213.md" deleted file mode 100644 index 90e0f82..0000000 --- 
"a/_posts/2022-05-28-OceanBase\344\270\216TiDB\344\274\230\345\214\226\345\231\250\347\232\204\345\237\272\346\225\260\351\242\204\344\274\260\345\207\206\347\241\256\345\272\246\345\222\214\350\277\236\346\216\245\351\241\272\345\272\217\351\200\211\346\213\251\350\203\275\345\212\233\347\232\204\350\257\204\346\265\213.md" +++ /dev/null @@ -1,456 +0,0 @@ ---- -title: OceanBase与TiDB优化器的基数预估准确度和连接顺序选择能力的评测 -tags: oceanbase tidb -author: 项兆坤 -member: 项兆坤 ---- - -## 一、引言 - -查询优化器作为数据库查询引擎的大脑,负责生成理想的执行计划,一直以来都被认为是查询引擎中最重要最核心的部分。现代数据库系统的优化器都是基于代价的优化器(Cost-based Optimizer, CBO),使用代价模型选出最佳的执行计划。相关研究表明,提升基数预估的准确度比代价模型中的CPU权重、IO权重等参数的作用大的多。另一方面,由于多表连接负载存在着庞大的连接顺序搜索空间,为多表连接负载确定最优的连接顺序也是一项艰难的任务。因此,优化器在不同情况下的基数预估准确度和连接顺序选择的质量可作为评测优化器的两个关键要点。本文将使用自研的工具对OceanBase、TiDB的基数预估、连接顺序选择的质量以及对于复杂连接形状的处理能力做出评测和对比。 - -## 二、背景知识和实验设置 - -## 1.基数预估 - -基数预估的作用是预估查询执行计划中算子的输出结果集大小。作为代价模型中的重要参数,基数预估的准确度会对查询执行计划的选择造成很大的影响,确保基数预估的准确度十分重要。在OceanBase和TiDB中,均可使用Explain关键字来查看优化器选出的执行计划中所有算子的基数预估结果。比如,在OceanBase中,对负载SELECT * FROM t1,t2 WHERE t1.c2=t2.c2 AND t2.c1 > 4 的Explain结果如下所示\[1\],表示OceanBase选定HashJoin作为表t1和t2之间连接的物理算法,预估的连接基数大小为9801000。 - -``` -`Query Plan: -======================================= -|ID|OPERATOR |NAME|EST. 
ROWS|COST | ---------------------------------------- -|0 |HASH JOIN | |9801000 |5933109| -|1 | TABLE SCAN|t2 |10000 |6219 | -|2 | TABLE SCAN|t1 |100000 |68478 | -=======================================` -``` - -## 2.连接形式和连接顺序 - -连接形式也叫连接图(Join Graph),文献\[2\]中总结了可能出现的一些连接图,如图1所示,主要包括链式连接(Chain)、星型连接(Star)、树型连接(Tree)、环型连接(Cycle)、集团连接(Clique)等。其中,Cycle、Clique、Cyclic及Grid形式的连接比较复杂,在构建连接的过程中,这些形式的连接会导致新参与连接的表与已经连接的表之间存在多个连接关系,在本文中,我们称这些连接形式为复杂连接形式。 - - - -图1 连接图\[2\] -{:.center} - -对于N表连接负载,存在的连接顺序有(2\*N-2)!/(N-1)!个,优化器会使用一些方法(比如动态规划或贪心算法)来枚举连接顺序。由于枚举所有可能的连接顺序的代价较大,因此优化器只会枚举其子集,这可能导致优化器无法为某些多表连接负载确定最佳的连接顺序。另一方面,基数预估和连接顺序的选择是相互影响的,基数预估通过影响代价模型,从而对连接顺序的选择造成影响。同时,不同的连接顺序也会影响基数预估。同样的多表连接,不同数据库的优化器可能选出不同的连接顺序,因此,使用相同的多表连接负载测试不同数据库对其连接算子的基数预估准确度时,应固定相同的连接顺序。OceanBase和TiDB分别提供了LEADING和/\*! STRAIGHT_JOIN */关键字来指定数据库以特定的连接顺序执行多表连接负载。 - -## 3.实验环境 - -由于查询优化器代价模型暂时无法控制,为了降低分布式环境下代价模型的影响,本文实验使用的Oceanbase和TiDB均为单机版。Oceanbase的版本为3.1.2,TiDB的版本为6.0,其中TiDB单机版包括一个TiDB组件、一个PD组件、一个TiKV组件及一个TiFlash组件。两者均在操作系统为Centos 7.9,内存为8G,CPU型号为16核 Intel Xeon Processor (Cascadelake)的机器上运行。 - -OceanBase的配置文件如下所示: - -```yaml -`global: - devname: eth0 - cluster_id: 1 - memory_limit: 8G - system_memory: 4G - stack_size: 512K - cpu_count: 16 - cache_wash_threshold: 1G - __min_full_resource_pool_memory: 268435456 - workers_per_cpu_quota: 10 - schema_history_expire_time: 1d - net_thread_count: 4 - major_freeze_duty_time: Disable - minor_freeze_times: 10 - enable_separate_sys_clog: 0 - enable_merge_by_turn: FALSE - datafile_disk_percentage: 35 - syslog_level: WARN - enable_syslog_recycle: true - max_syslog_file_count: 4 - appname: obtest - mysql_port: 2883 - rpc_port: 2882 - home_path: /root/observer - data_dir: /data - redo_dir: /redo - zone: zone0 - -``` - -## 三、OceanBase基数预估准确度和TiDB的对比 - -优化器在进行基数预估时会进行均匀性(uniformity)假设,即会假定除了最频繁出现的数据,其他数据都是均匀分布的\[3\],这种假设会导致基数预估在具有倾斜分布的数据中的不准确,从而对执行计划的选择造成影响。传统的基数预估方法有直方图和采样的方法,无法对多表连接算子的基数做出准确的预估。 - 
-为了测试OceanBase和TiDB在不同情况下的基数预估准确度,本实验随机生成不同基数大小的单表、3表、5表链式连接负载,所有参与连接的表大小均相同,分别为10000和50000,并控制过滤谓词涉及属性数据的倾斜度分别为均匀分布、倾斜度为1的ZipFian分布及倾斜度为3的ZipFian分布,以评测OceanBase和TiDB这些场景下的基数预估情况,获得的基数预估结果包括Analyze Table之前的结果、Analyze Table(OceanBase对应的命令为Alter System Major Freeze)之后的结果以及Analyze Table之后多次Explain的结果(Explain 5次)。每个测试场景均生成10个负载。不同的优化器可能对相同的多表连接负载选定不同的连接顺序,为了消除这种影响,本实验使用相同的负载进行测试时固定其连接顺序为其对应的SQL形式中From关键字后罗列的表顺序。 - -下列表展示了单表过滤算子在不同表大小及数据倾斜度下的基数预估情况。 - - 单表过滤算子,表大小10000,数据为均匀分布 -{:.center} - -| 表大小10000,均匀分布 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 4609 | 3323.33 | 3331.0 | 3323.33 | 4608.21 | 3334.0 | 3334.0 | -| Q2 | 2914 | 3323.33 | 3331.0 | 3323.33 | 2914.34 | 3334.0 | 3334.0 | -| Q3 | 4970 | 3333.33 | 3331.0 | 3333.33 | 4970.75 | 3334.0 | 3334.0 | -| Q4 | 5637 | 3333.33 | 3331.0 | 3333.33 | 5637.41 | 3334.0 | 3334.0 | -| Q5 | 3692 | 3333.33 | 3331.0 | 3333.33 | 3333.33 | 3334.0 | 3334.0 | -| Q6 | 6570 | 3333.33 | 3331.0 | 3333.33 | 3333.33 | 3334.0 | 3334.0 | -| Q7 | 9065 | 3333.33 | 3331.0 | 3333.33 | 9065.74 | 3334.0 | 3334.0 | -| Q8 | 2126 | 3323.33 | 3331.0 | 3323.33 | 2126.22 | 3334.0 | 3334.0 | -| Q9 | 2727 | 3323.33 | 3331.0 | 3323.33 | 2727.81 | 3334.0 | 3334.0 | -| Q10 | 6327 | 3333.33 | 3331.0 | 3333.33 | 6326.08 | 3334.0 | 3334.0 | - - 单表过滤算子,表大小10000,数据倾斜度为1 -{:.center} - -| 表大小10000,倾斜度1 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 1095 | 3333.33 | 3327.0 | 3333.33 | 1095.0 | 3334.0 | 3334.0 | -| Q2 | 1313 | 3333.33 | 3327.0 | 3333.33 | 3333.33 | 3334.0 | 3334.0 | -| Q3 | 7018 | 3323.33 | 3327.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q4 | 75 | 
3333.33 | 3327.0 | 3333.33 | 75.34 | 3334.0 | 3334.0 | -| Q5 | 9019 | 3323.33 | 3327.0 | 3323.33 | 9019.0 | 3334.0 | 3334.0 | -| Q6 | 921 | 3333.33 | 3327.0 | 3333.33 | 920.06 | 3334.0 | 3334.0 | -| Q7 | 6832 | 3323.33 | 3327.0 | 3323.33 | 6833.85 | 3334.0 | 3334.0 | -| Q8 | 660 | 3333.33 | 3327.0 | 3333.33 | 3333.33 | 3334.0 | 3334.0 | -| Q9 | 9816 | 3323.33 | 3327.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q10 | 1227 | 3333.33 | 3327.0 | 3333.33 | 1225.15 | 3334.0 | 3334.0 | - - 单表过滤算子,表大小10000,数据倾斜度为3 -{:.center} - -| 表大小10000,倾斜度3 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 9994 | 3323.33 | 3327.0 | 3323.33 | 9994.0 | 3334.0 | 3334.0 | -| Q2 | 1676 | 3333.33 | 3327.0 | 3333.33 | 1676.0 | 3334.0 | 3334.0 | -| Q3 | 9997 | 3323.33 | 3327.0 | 3323.33 | 9997.0 | 3334.0 | 3334.0 | -| Q4 | 21 | 3333.33 | 3327.0 | 3333.33 | 21.0 | 3334.0 | 3334.0 | -| Q5 | 9999 | 3323.33 | 3327.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q6 | 8324 | 3323.33 | 3327.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q7 | 9949 | 3323.33 | 3327.0 | 3323.33 | 9949.0 | 3334.0 | 3334.0 | -| Q8 | 9990 | 3323.33 | 3327.0 | 3323.33 | 9990.0 | 3334.0 | 3334.0 | -| Q9 | 26 | 3333.33 | 3327.0 | 3333.33 | 26.0 | 3334.0 | 3334.0 | -| Q10 | 9979 | 3323.33 | 3327.0 | 3323.33 | 9979.0 | 3334.0 | 3334.0 | - - 单表过滤算子,表大小50000,数据为均匀分布 -{:.center} - -| 表大小50000,均匀分布 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 7008 | 16616.67 | 16634.0 | 16616.67 | 7007.86 | 16667.0 | 16667.0 | -| Q2 | 6499 | 16666.67 | 16634.0 | 16666.67 | 6499.88 | 16667.0 | 16667.0 | -| Q3 | 17387 | 16616.67 | 16634.0 | 16616.67 | 17387.83 | 
16667.0 | 16667.0 | -| Q4 | 1567 | 16666.67 | 16634.0 | 16666.67 | 16666.67 | 16667.0 | 16667.0 | -| Q5 | 5445 | 16666.67 | 16634.0 | 16666.67 | 16666.67 | 16667.0 | 16667.0 | -| Q6 | 41096 | 16666.67 | 16634.0 | 16666.67 | 41095.27 | 16667.0 | 16667.0 | -| Q7 | 38328 | 16666.67 | 16634.0 | 16666.67 | 38328.33 | 16667.0 | 16667.0 | -| Q8 | 25931 | 16616.67 | 16634.0 | 16616.67 | 25931.06 | 16667.0 | 16667.0 | -| Q9 | 32516 | 16616.67 | 16634.0 | 16616.67 | 32516.54 | 16667.0 | 16667.0 | -| Q10 | 18108 | 16616.67 | 16634.0 | 16616.67 | 16616.67 | 16667.0 | 16667.0 | - - 单表过滤算子,表大小50000,数据倾斜度为1 -{:.center} - -| 表大小50000,倾斜度1 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 33948 | 16616.67 | 16627.0 | 16616.67 | 33948.0 | 16667.0 | 16667.0 | -| Q2 | 7752 | 16666.67 | 16627.0 | 16666.67 | 7742.74 | 16667.0 | 16667.0 | -| Q3 | 44944 | 16616.67 | 16627.0 | 16616.67 | 44953.26 | 16667.0 | 16667.0 | -| Q4 | 49307 | 16616.67 | 16627.0 | 16616.67 | 16616.67 | 16667.0 | 16667.0 | -| Q5 | 147 | 16666.67 | 16627.0 | 16666.67 | 16666.67 | 16667.0 | 16667.0 | -| Q6 | 2948 | 16666.67 | 16627.0 | 16666.67 | 2939.95 | 16667.0 | 16667.0 | -| Q7 | 1098 | 16666.67 | 16627.0 | 16666.67 | 1099.86 | 16667.0 | 16667.0 | -| Q8 | 6932 | 16666.67 | 16627.0 | 16666.67 | 6922.74 | 16667.0 | 16667.0 | -| Q9 | 49720 | 16616.67 | 16627.0 | 16616.67 | 49719.96 | 16667.0 | 16667.0 | -| Q10 | 6201 | 16666.67 | 16627.0 | 16666.67 | 16666.67 | 16667.0 | 16667.0 | - - 单表过滤算子,表大小50000,数据倾斜度为3 -{:.center} - -| 表大小50000,倾斜度3 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 36 | 16666.67 | 16626.0 | 16666.67 | 36.0 
| 16667.0 | 16667.0 | -| Q2 | 49992 | 16616.67 | 16626.0 | 16616.67 | 49992.0 | 16667.0 | 16667.0 | -| Q3 | 19 | 16666.67 | 16626.0 | 16666.67 | 19.0 | 16667.0 | 16667.0 | -| Q4 | 40 | 16666.67 | 16626.0 | 16666.67 | 40.0 | 16667.0 | 16667.0 | -| Q5 | 49823 | 16616.67 | 16626.0 | 16616.67 | 16616.67 | 16667.0 | 16667.0 | -| Q6 | 177 | 16666.67 | 16626.0 | 16666.67 | 16666.67 | 16667.0 | 16667.0 | -| Q7 | 146 | 16666.67 | 16626.0 | 16666.67 | 146.0 | 16667.0 | 16667.0 | -| Q8 | 478 | 16666.67 | 16626.0 | 16666.67 | 478.0 | 16667.0 | 16667.0 | -| Q9 | 45 | 16666.67 | 16626.0 | 16666.67 | 45.0 | 16667.0 | 16667.0 | -| Q10 | 49781 | 16616.67 | 16626.0 | 16616.67 | 49781.0 | 16667.0 | 16667.0 | - -从以上单表过滤算子的基数预估情况可以看出,不管有没有Analyze Table获得统计信息,OceanBase和TiDB对于单表过滤算子的基数预估结果比较固定,与表的大小有关,会随着表大小的成比例增大。有趣的是,TiDB在多次使用Explain获取基数预估结果的过程中,其基数预估的准确度会越来越高。 - -下列表展示了3表连接算子在不同表大小及数据倾斜度下的基数预估准确度。 - -3表连接,表大小均为10000,过滤谓词涉及属性的数据为均匀分布 -{:.center} - -| 表大小10000,均匀分布 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 272 | 5177.13 | 3263.0 | 3320.01 | 621.58 | 3334.0 | 3334.0 | -| Q2 | 1394 | 5187.52 | 3264.0 | 3320.01 | 2094.13 | 3334.0 | 3334.0 | -| Q3 | 3250 | 5182.33 | 3262.0 | 3320.01 | 5948.56 | 3334.0 | 3334.0 | -| Q4 | 1185 | 5182.33 | 3260.0 | 3320.01 | 3320.01 | 3334.0 | 3334.0 | -| Q5 | 724 | 5177.13 | 3263.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q6 | 5 | 5187.52 | 3261.0 | 3323.33 | 23.08 | 3334.0 | 3334.0 | -| Q7 | 274 | 5192.71 | 3262.0 | 3323.33 | 2908.19 | 3334.0 | 3334.0 | -| Q8 | 313 | 5187.52 | 3263.0 | 3323.33 | 794.45 | 3334.0 | 3334.0 | -| Q9 | 127 | 5187.52 | 3263.0 | 3323.33 | 400.0 | 3334.0 | 3334.0 | -| Q10 | 1542 | 5182.33 | 3263.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | - - 3表连接,表大小均为10000,过滤谓词涉及属性的数据倾斜度为1 -{:.center} - -| 表大小10000,倾斜度1 | 真实基数 | TiDB Analyze 
Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 164 | 5197.92 | 3266.0 | 3330.0 | 3330.0 | 3334.0 | 3334.0 | -| Q2 | 9 | 5203.12 | 3264.0 | 3330.0 | 9.85 | 3334.0 | 3334.0 | -| Q3 | 116 | 5192.71 | 3266.0 | 3323.33 | 466.0 | 3334.0 | 3334.0 | -| Q4 | 12 | 5187.52 | 3266.0 | 3323.33 | 254.0 | 3334.0 | 3334.0 | -| Q5 | 13 | 5177.13 | 3264.0 | 3320.01 | 3031.15 | 3334.0 | 3334.0 | -| Q6 | 1597 | 5182.33 | 3264.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q7 | 86 | 5187.52 | 3264.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q8 | 785 | 5187.52 | 3264.0 | 3323.33 | 3336.0 | 3334.0 | 3334.0 | -| Q9 | 2853 | 5166.78 | 3266.0 | 3323.33 | 4664.0 | 3334.0 | 3334.0 | -| Q10 | 5898 | 5187.52 | 3264.0 | 3323.33 | 5899.85 | 3334.0 | 3334.0 | - -3表连接,表大小均为10000,过滤谓词涉及属性的数据倾斜度为3  -{:.center} - -| 表大小10000,倾斜度3 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 8324 | 5182.33 | 3265.0 | 3316.69 | 8324.0 | 3334.0 | 3334.0 | -| Q2 | 1041 | 5187.52 | 3263.0 | 3320.01 | 1676.0 | 3334.0 | 3334.0 | -| Q3 | 438 | 5192.71 | 3263.0 | 3323.33 | 635.0 | 3334.0 | 3334.0 | -| Q4 | 10 | 5182.33 | 3263.0 | 3320.01 | 3320.01 | 3334.0 | 3334.0 | -| Q5 | 9365 | 5187.52 | 3263.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q6 | 308 | 5187.52 | 3261.0 | 3323.33 | 635.0 | 3334.0 | 3334.0 | -| Q7 | 6 | 5187.5 | 3265.0 | 3323.33 | 14.0 | 3334.0 | 3334.0 | -| Q8 | 70 | 5182.33 | 3265.0 | 3323.33 | 91.0 | 3334.0 | 3334.0 | -| Q9 | 8 | 5197.92 | 3261.0 | 3333.33 | 8.0 | 3334.0 | 3334.0 | -| Q10 | 18 | 5182.33 | 3265.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | - - 3表连接,表大小均为50000,过滤谓词涉及属性的数据为均匀分布 -{:.center} - -| 表大小50000,均匀分布 | 真实基数 | TiDB 
Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 18758 | 25885.65 | 16335.0 | 16600.05 | 22765.17 | 16667.0 | 16667.0 | -| Q2 | 4706 | 25963.54 | 16337.0 | 16616.67 | 19569.44 | 16667.0 | 16667.0 | -| Q3 | 170 | 25937.58 | 16335.0 | 16616.67 | 170.46 | 16667.0 | 16667.0 | -| Q4 | 1632 | 25963.54 | 16335.0 | 16616.67 | 1734.37 | 16667.0 | 16667.0 | -| Q5 | 803 | 25989.61 | 16334.0 | 16650.0 | 16650.0 | 16667.0 | 16667.0 | -| Q6 | 5979 | 25937.58 | 16335.0 | 16616.67 | 16616.67 | 16667.0 | 16667.0 | -| Q7 | 3236 | 25963.54 | 16334.0 | 16616.67 | 22334.68 | 16667.0 | 16667.0 | -| Q8 | 14231 | 25937.58 | 16334.0 | 16616.67 | 17668.03 | 16667.0 | 16667.0 | -| Q9 | 5402 | 26015.62 | 16335.0 | 16666.67 | 18521.98 | 16667.0 | 16667.0 | -| Q10 | 3292 | 25963.54 | 16335.0 | 16616.67 | 16069.18 | 16667.0 | 16667.0 | - - 3表连接,表大小均为50000,过滤谓词涉及属性的数据倾斜度为1 -{:.center} - -| 表大小50000,倾斜度1 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 43381 | 16600.05 | 16335.0 | 43390.26 | 43390.26 | 16667.0 | 16667.0 | -| Q2 | 9990 | 16600.05 | 16335.0 | 14423.0 | 14423.0 | 16667.0 | 16667.0 | -| Q3 | 1429 | 16600.05 | 16335.0 | 13020.0 | 13020.0 | 16667.0 | 16667.0 | -| Q4 | 278 | 16616.67 | 16335.0 | 7390.74 | 7390.74 | 16667.0 | 16667.0 | -| Q5 | 20729 | 16600.05 | 16335.0 | 20729.0 | 20729.0 | 16667.0 | 16667.0 | -| Q6 | 3249 | 16616.67 | 16335.0 | 10002.74 | 10002.74 | 16667.0 | 16667.0 | -| Q7 | 1290 | 16600.05 | 16335.0 | 1463.64 | 1463.64 | 16667.0 | 16667.0 | -| Q8 | 7169 | 16616.67 | 16335.0 | 12225.0 | 12225.0 | 16667.0 | 16667.0 | -| Q9 | 385 | 16616.67 | 16336.0 | 19938.74 | 19938.74 | 16667.0 | 16667.0 | 
-| Q10 | 1041 | 16616.67 | 16335.0 | 2848.74 | 2848.74 | 16667.0 | 16667.0 | - - 3表连接,表大小均为50000,过滤谓词涉及属性的数据倾斜度为3 -{:.center} - -| 表大小50000,倾斜度3 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 49329 | 16600.05 | 16305.0 | 49329.0 | 49329.0 | 16667.0 | 16667.0 | -| Q2 | 196 | 16616.67 | 16305.0 | 219.0 | 219.0 | 16667.0 | 16667.0 | -| Q3 | 15 | 16600.05 | 16306.0 | 103.0 | 103.0 | 16667.0 | 16667.0 | -| Q4 | 74 | 16616.67 | 16305.0 | 177.0 | 177.0 | 16667.0 | 16667.0 | -| Q5 | 50 | 16600.05 | 16305.0 | 51.0 | 51.0 | 16667.0 | 16667.0 | -| Q6 | 12 | 16616.67 | 16305.0 | 21.0 | 21.0 | 16667.0 | 16667.0 | -| Q7 | 193 | 16600.05 | 16304.0 | 671.0 | 671.0 | 16667.0 | 16667.0 | -| Q8 | 49897 | 16616.67 | 16305.0 | 49897.0 | 49897.0 | 16667.0 | 16667.0 | -| Q9 | 41604 | 16616.67 | 16304.0 | 41604.0 | 41604.0 | 16667.0 | 16667.0 | -| Q10 | 549 | 16616.67 | 16304.0 | 671.0 | 671.0 | 16667.0 | 16667.0 | - -从以上3表连接算子在不同表大小以及数据倾斜度下的基数预估情况来看,在Analyze Table之前,由于OceanBase和TiDB都没有统计信息,因此会把这列数据当成均匀分布来看,其结果较为固定,不会随着真实基数的改变而改变。然而,在Analyze Table之后,首次使用Explain获取TiDB的基数预估结果已经会随着真实基数的改变而改变,呈现高估的现象,而OceanBase的基数预估结果相比Major Freeze之前有所改变,但仍然是固定的数值。另外,TiDB的基数预估是不稳定的,在表大小50000,数据均匀分布的情况下,我们可以发现,在Analyze Table之后,首次使用Explain并不能获得随真实基数变化的预估结果。 - -下列表展示了5表连接算子在不同表大小及数据倾斜度下的基数预估准确度。 - -5表连接,表大小均为10000,过滤谓词涉及属性的数据为均匀分布 -{:.center} - -| 表大小10000,均匀分布 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 15 | 8089.27 | 3199.0 | 3320.01 | 3320.01 | 3334.0 | 3334.0 | -| Q2 | 88 | 8089.29 | 3202.0 | 3320.01 | 3320.01 | 3334.0 | 3334.0 | -| Q3 | 1323 | 8081.18 | 3199.0 | 3320.01 | 3360.19 | 3334.0 | 3334.0 | -| Q4 | 22 
| 8089.27 | 3196.0 | 3316.69 | 1569.78 | 3334.0 | 3334.0 | -| Q5 | 870 | 8105.49 | 3199.0 | 3320.01 | 870.46 | 3334.0 | 3334.0 | -| Q6 | 1731 | 8097.39 | 3199.0 | 3323.33 | 5484.2 | 3334.0 | 3334.0 | -| Q7 | 26 | 8105.49 | 3199.0 | 3320.01 | 3320.01 | 3334.0 | 3334.0 | -| Q8 | 188 | 8097.36 | 3199.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q9 | 181 | 8065.02 | 3194.0 | 3316.69 | 980.68 | 3334.0 | 3334.0 | -| Q10 | 451 | 8089.29 | 3198.0 | 3320.01 | 4432.78 | 3334.0 | 3334.0 | - - 5表连接,表大小均为10000,过滤谓词涉及属性的数据倾斜度为1 -{:.center} - -| 表大小10000,倾斜度1 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 82 | 8081.18 | 3199.0 | 3320.01 | 3320.01 | 3334.0 | 3334.0 | -| Q2 | 6 | 8113.61 | 3199.0 | 3323.33 | 19.89 | 3334.0 | 3334.0 | -| Q3 | 10 | 8097.39 | 3195.0 | 3323.33 | 736.15 | 3334.0 | 3334.0 | -| Q4 | 19 | 8105.49 | 3199.0 | 3320.01 | 3582.15 | 3334.0 | 3334.0 | -| Q5 | 24 | 8105.49 | 3199.0 | 3323.33 | 2027.15 | 3334.0 | 3334.0 | -| Q6 | 104 | 8065.0 | 3202.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q7 | 56 | 8073.1 | 3199.0 | 3320.01 | 3320.01 | 3334.0 | 3334.0 | -| Q8 | 85 | 8081.18 | 3203.0 | 3320.01 | 3323.33 | 3334.0 | 3334.0 | -| Q9 | 23 | 8089.27 | 3199.0 | 3323.33 | 109.4 | 3334.0 | 3334.0 | -| Q10 | 648 | 8065.02 | 3203.0 | 3320.01 | 2567.15 | 3334.0 | 3334.0 | - -5表连接,表大小均为10000,过滤谓词涉及属性的数据倾斜度为3  -{:.center} - -| 表大小10000,倾斜度3 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 24 | 8105.47 | 3196.0 | 3323.33 | 91.0 | 3334.0 | 3334.0 | -| Q2 | 16 | 8097.39 | 3196.0 | 3320.01 | 67.0 | 3334.0 | 3334.0 | -| Q3 | 67 | 8089.27 | 3199.0 | 3323.33 | 197.0 | 3334.0 | 3334.0 | -| 
Q4 | 6 | 8089.27 | 3194.0 | 3320.01 | 32.0 | 3334.0 | 3334.0 | -| Q5 | 8324 | 8081.18 | 3194.0 | 3320.01 | 3320.01 | 3334.0 | 3334.0 | -| Q6 | 1349 | 8105.49 | 3196.0 | 3323.33 | 3323.33 | 3334.0 | 3334.0 | -| Q7 | 1041 | 8081.2 | 3197.0 | 3320.01 | 1676.0 | 3334.0 | 3334.0 | -| Q8 | 308 | 8065.02 | 3199.0 | 3320.01 | 635.0 | 3334.0 | 3334.0 | -| Q9 | 9 | 8081.2 | 3204.0 | 3320.01 | 26.0 | 3334.0 | 3334.0 | -| Q10 | 7 | 8073.1 | 3196.0 | 3320.01 | 21.0 | 3334.0 | 3334.0 | - - 5表连接,表大小均为50000,过滤谓词涉及属性的数据为均匀分布 -{:.center} - -| 表大小50000,均匀分布 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 131 | 40365.48 | 16010.0 | 16600.05 | 619.1 | 16667.0 | 16667.0 | -| Q2 | 6075 | 26015.62 | 15979.0 | 16583.45 | 16583.45 | 16667.0 | 16667.0 | -| Q3 | 30 | 32357.16 | 16010.0 | 16583.45 | 16583.45 | 16667.0 | 16667.0 | -| Q4 | 958 | 32357.16 | 15979.0 | 16600.05 | 1643.99 | 16667.0 | 16667.0 | -| Q5 | 181 | 32389.55 | 15979.0 | 1342.14 | 1342.14 | 16667.0 | 16667.0 | -| Q6 | 1263 | 32389.45 | 15979.0 | 16616.67 | 16020.82 | 16667.0 | 16667.0 | -| Q7 | 3621 | 25989.61 | 15979.0 | 16616.67 | 10199.24 | 16667.0 | 16667.0 | -| Q8 | 630 | 25963.62 | 15979.0 | 16616.67 | 16616.67 | 16667.0 | 16667.0 | -| Q9 | 482 | 32421.97 | 15979.0 | 16616.67 | 16616.67 | 16667.0 | 16667.0 | -| Q10 | 2143 | 25963.54 | 16042.0 | 16616.67 | 15048.5 | 16667.0 | 16667.0 | - - 5表连接,表大小均为50000,过滤谓词涉及属性的数据倾斜度为1 -{:.center} - -| 表大小50000,倾斜度1 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 6474 | 40446.45 | 15985.0 | 16583.45 | 27418.0 | 16667.0 | 16667.0 | -| Q2 | 954 | 40486.82 | 15985.0 | 16616.67 | 3095.07 | 
16667.0 | 16667.0 | -| Q3 | 132 | 40446.33 | 15989.0 | 16600.05 | 3434.36 | 16667.0 | 16667.0 | -| Q4 | 459 | 40365.48 | 15989.0 | 16600.05 | 13104.74 | 16667.0 | 16667.0 | -| Q5 | 14 | 40365.48 | 16032.0 | 16600.05 | 16600.05 | 16667.0 | 16667.0 | -| Q6 | 648 | 40324.99 | 15985.0 | 16616.67 | 16616.67 | 16667.0 | 16667.0 | -| Q7 | 210 | 40405.88 | 16010.0 | 16600.05 | 2778.0 | 16667.0 | 16667.0 | -| Q8 | 53 | 40486.94 | 16007.0 | 16616.67 | 805.02 | 16667.0 | 16667.0 | -| Q9 | 416 | 40486.94 | 16010.0 | 16616.67 | 4436.74 | 16667.0 | 16667.0 | -| Q10 | 29 | 40446.33 | 16010.0 | 16616.67 | 9777.0 | 16667.0 | 16667.0 | - - 5表连接,表大小均为50000,过滤谓词涉及属性的数据倾斜度为3 -{:.center} - -| 表大小50000,倾斜度3 | 真实基数 | TiDB Analyze Table前 | OceanBase Major Freeze前 | TiDB Analyze Table后首次Explain | TiDB Analyze Table后多次Explain | OceanBase Major Freeze后首次Explain | OceanBase Major Freeze后多次Explain | -| --- | --- | --- | --- | --- | --- | --- | --- | -| Q1 | 41604 | 16600.05 | 16010.0 | 41604.0 | 41604.0 | 16667.0 | 16667.0 | -| Q2 | 180 | 16600.05 | 16010.0 | 357.0 | 357.0 | 16667.0 | 16667.0 | -| Q3 | 15 | 16600.05 | 16010.0 | 103.0 | 103.0 | 16667.0 | 16667.0 | -| Q4 | 8 | 16600.05 | 16017.0 | 66.0 | 66.0 | 16667.0 | 16667.0 | -| Q5 | 34 | 16600.05 | 16004.0 | 122.0 | 122.0 | 16667.0 | 16667.0 | -| Q6 | 5 | 16600.05 | 16010.0 | 26.0 | 26.0 | 16667.0 | 16667.0 | -| Q7 | 1542 | 16616.67 | 16010.0 | 3196.0 | 3196.0 | 16667.0 | 16667.0 | -| Q8 | 5200 | 16600.05 | 16010.0 | 8396.0 | 8396.0 | 16667.0 | 16667.0 | -| Q9 | 333 | 16616.67 | 16010.0 | 1004.0 | 1004.0 | 16667.0 | 16667.0 | -| Q10 | 10 | 16616.67 | 16017.0 | 23.0 | 23.0 | 16667.0 | 16667.0 | - -从以上5表连接算子的基数预估结果,我们可以得出与3表连接中类似的现象和结论。 - -## 四、OceanBase和TiDB对于星型连接顺序选择质量的对比 - -星型连接在数据仓库等OLAP场景中十分常见,主要包括一个事实表和多个维度表之间进行主键-外键连接,事实表一般比维度表大。数据库对于星型连接的处理能力反应了该数据库在OLAP领域的适用度。本实验控制维度表的大小范围在\[10,50\],事实表的大小分别为10000,50000,100000,500000,1000000,在不同事实表大小的情况下分别随机生成50个8表星型连接查询。基于贪心的思想,优先选择连接基数小的算子先进行连接(包括笛卡尔积),对多表星型连接进行连接顺序的重排。比如在A,B,C,D,E 
5表连接中,首先选择两个连接基数最小的表做连接,中间结果为Join\_a;接着从剩下的表中选择与Join\_a连接基数最小的表进行连接,重复该过程直到所有的表都参与连接。本实验以重排后的连接顺序作为基准,对OceanBase和TiDB优化器选定的连接顺序进行平均执行时间的对比。为了避免执行计划缓存的影响,本实验在OceanBase和TiDB中均设置关闭执行计划缓存。 - -图2展示了维度表大小不同的情况下,两种数据库经过连接顺序重排前后的执行时间对比,横坐标表示事实表大小,纵坐标表示执行时间。可以发现,两种数据库的优化器在经典的星型连接场景下,均无法选出最优的连接顺序,存在连接顺序选择策略的提升空间。同时我们还可以从本实验场景中看出,在事实表大小为100000及以下,OceanBase和TiDB在处理星型连接时的性能接近,在事实表大小为500000和1000000时,OceanBase和TiDB处理星型连接的执行时间差异略大。 - - - -图2 OceanBase和TiDB优化器选择的连接顺序和本文基于连接基数最小原则重排后的连接顺序性能对比 -{:.center} - -为了评测两种数据库优化器对于星型连接的连接顺序选择策略的可提升空间,我们使用连接顺序重排后的执行计划作为基准计划,计算两种数据库重排前的连接顺序和重排后的连接顺序的执行时间的比值,当作执行效率提升的倍数。两种数据库的优化器对于星型连接的可提升空间如图3所示,横坐标表示事实表大小,纵坐标表示执行效率提升的倍数。由本实验可知,在事实表大小为100000及以下时,TiDB优化器对于星型连接的连接顺序选择策略的可提升空间大于OceanBase;在事实表大小为500000和1000000时,两种数据库的优化器选出的执行计划的性能和本实验的基准计划的执行性能相似。另一方面,OceanBase优化器所选的执行计划和我们重排连接顺序后的基准计划相比,其可提升空间随着事实表的增大呈现降低的趋势。 - -由于OceanBase支持Bushy Tree,我们目前的连接顺序重排算法只能基于连接基数最小原则给出基数最优的左深树,后续可改进我们的连接顺序重排算法,使得其支持Bushy Tree,从而做出更深度的连接顺序选择质量的评测。 - - - -图3 OceanBase和TiDB优化器对于星型连接的连接顺序选择策略的可提升空间 -{:.center} - -注:本实验的所有数据和负载可通过链接获取:https://drive.google.com/drive/folders/1P53_FWfusCa3xhSSZLDCBZm1VZy52hBi?usp=sharing,包括重排前的负载和重排后的负载。 - -## 五、OceanBase和TiDB对于复杂连接形式处理能力的对比 - -本节首先展示OceanBase和TiDB是否全部支持图1不同的连接形式(或连接图),随机生成有意义的7种不同连接形式的负载,查看两种数据库是否可执行,结果如下表所示。 - -| | TiDB | OceanBase | -| --- | --- | --- | -| Chain Join | 支持 | 支持 | -| Star Join | 支持 | 支持 | -| Cycle Join  | 支持 | 支持 | -| Clique Join | 支持 | 支持 | -| Cyclic Join | 支持 | 支持 | -| Tree Join | 支持 | 支持 | -| Grid Join | 支持 | 支持 | - -为了评测OceanBase和TiDB处理复杂连接形式的性能,本实验设定所有表大小均为100万,分别随机生成50个4表连接、5表连接、6表连接、7表连接、8表连接和9表连接负载,将这些负载在OceanBase和TiDB分别执行并对比整体执行时间。本实验保证负载完全能产生有意义的非空结果,负载中涉及到的复杂连接方式包括Cycle Join、Cyclic Join及Clique Join,所有连接均为主键-外键连接。 - -图4、图5和图6展示了在本文的测试场景下,OceanBase和TiDB在Clique Join、Cycle Join及Cyclic Join情况下的执行时延(Latency),横坐标表示参与连接的表数目。 - - - -图4 OceanBase和TiDB在不同连接数目的Clique Join中的执行时间 -{:.center} - - - -图5 OceanBase和TiDB在不同连接数目的Cycle Join中的执行时间 -{:.center} - - - -图6 OceanBase和TiDB在不同连接数目的Cyclic Join中的执行时间 -{:.center} - 
-从图4、图5和图6中可以看出,OceanBase处理复杂连接形式负载的整体时延高于TiDB,在我们随机生成的测试场景中,OceanBase处理复杂连接形式负载的时延大部分为千级别(ms),而TiDB的时延为稳定的百级别(ms)。此外,在环型连接(Cycle Join)中,OceanBase处理8表连接和9表连接的时延达到了万级别(ms)。 - -## 六、总结 - -基于本文的实验,我们总结如下: - -1.基数预估方面,在Analyze Table之前,OceanBase和TiDB都会默认数据为均匀分布,该种情况下的基数预估结果和真实基数无关,随着表大小成比例改变。在Analyze Table之后,TiDB的基数预估不固定,首次使用Explain获取预估结果和多次使用Explain获取结果可能不一致,而OceanBase经过Major Freeze后,其基数预估结果仍不会随真实基数的改变而改变。 - -2.在星型连接场景中,OceanBase和TiDB的优化器均无法选出最佳的连接顺序,其中OceanBase的优化器选择的连接顺序的质量比TiDB更接近于本文基于连接基数最小原则进行重排后的连接顺序。 - -3.在复杂连接形式的处理性能方面,在百万级别数据量的多表连接情况下,OceanBase的性能要低于TiDB,未来应在OLAP方面加强。 - -## 七、参考材料 - -\[1\] Explain, https://open.oceanbase.com/docs/observer-cn/V3.1.2/10000000000015437 - -\[2\] Join Order, https://db.in.tum.de/teaching/ws1415/queryopt/chapter3.pdf?lang=de - -\[3\] Leis, Viktor, et al. "Query optimization through the looking glass, and what we found running the join order benchmark." *The VLDB Journal* 27.5 (2018): 643-668. \ No newline at end of file diff --git a/blog/index.md b/blog/index.md index 5a3057d..31c5171 100644 --- a/blog/index.md +++ b/blog/index.md @@ -9,19 +9,10 @@ nav: {% include section.html %} -{% include search-info.html %} - -{% include blog-list.html data="posts" component="post-excerpt" %} - -{% include section.html %} - - +{% include search-box.html %} - +{% include tags.html tags=site.tags %} - +{% include list.html data="posts" component="post-excerpt" %} diff --git a/contact/index.md b/contact/index.md index d9b7e4b..1fd4455 100644 --- a/contact/index.md +++ b/contact/index.md @@ -1,5 +1,5 @@ --- -title: Contact +title: 联系我们 nav: order: 5 tooltip: Email, address, and location @@ -7,71 +7,18 @@ nav: # {% include icon.html icon="fa-regular fa-envelope" %}Contact -Lorem ipsum dolor sit amet, consectetur adipiscing elit, sed do eiusmod tempor -incididunt ut labore et dolore magna aliqua. Ut enim ad minim veniam, quis -nostrud exercitation ullamco laboris nisi ut aliquip ex ea commodo consequat. +欢迎各位同学加入 DBHammer 实验室! 
{% include button.html type="email" - text="jane@smith.com" - link="jane@smith.com" -%} -{% - include button.html - type="phone" - text="(555) 867-5309" - link="+1-555-867-5309" + text="rzhang@dase.ecnu.edu.cn" + link="rzhang@dase.ecnu.edu.cn" %} {% include button.html type="address" tooltip="Our location on Google Maps for easy navigation" - link="https://www.google.com/maps" -%} - -{% include section.html %} - -{% capture col1 %} - -{% - include figure.html - image="images/photo.jpg" - caption="Lorem ipsum" + link="https://www.google.com/maps/place/%E5%8D%8E%E4%B8%9C%E5%B8%88%E8%8C%83%E5%A4%A7%E5%AD%A6/@31.1437572,121.1860237,12z/data=!4m10!1m2!2m1!1z5Y2O5Lic5biI6IyD5aSn5a2m!3m6!1s0x35b2657fc9a83b9f:0x75cd3a460e8eebd9!8m2!3d31.227667!4d121.406829!15sChLljY7kuJzluIjojIPlpKflraYiA4gBAZIBB2NvbGxlZ2XgAQA!16zL20vMDFoejA2?entry=ttu&g_ep=EgoyMDI1MDEwOC4wIKXMDSoASAFQAw%3D%3D" %} -{% endcapture %} - -{% capture col2 %} - -{% - include figure.html - image="images/photo.jpg" - caption="Lorem ipsum" -%} - -{% endcapture %} - -{% include cols.html col1=col1 col2=col2 %} - -{% include section.html dark=true %} - -{% capture col1 %} -Lorem ipsum dolor sit amet -consectetur adipiscing elit -sed do eiusmod tempor -{% endcapture %} - -{% capture col2 %} -Lorem ipsum dolor sit amet -consectetur adipiscing elit -sed do eiusmod tempor -{% endcapture %} - -{% capture col3 %} -Lorem ipsum dolor sit amet -consectetur adipiscing elit -sed do eiusmod tempor -{% endcapture %} - -{% include cols.html col1=col1 col2=col2 col3=col3 %} diff --git a/news/index.md b/news/index.md index 4ab9c0a..ca8566a 100644 --- a/news/index.md +++ b/news/index.md @@ -10,23 +10,30 @@ nav:

{%- assign data = site.news -%} -{%- assign sorted_data = data | sort: "date" | reverse -%} - - - +{%- if data -%} + {%- assign sorted_data = data | sort: "date" | reverse -%} + +{%- else -%} +

暂无新闻内容。

+{%- endif -%}
\ No newline at end of file diff --git a/tools/index.md b/project/index.md similarity index 81% rename from tools/index.md rename to project/index.md index 7c7fb49..0df2362 100644 --- a/tools/index.md +++ b/project/index.md @@ -24,22 +24,30 @@ DBHammer实验室研发了多款支持数据库系统评测的工具,包括: ## 面向数据库的功能评测 -{% include toollist.html component="toolcard" data="tools" filters="group: function-evaluation" %} +{% include list.html component="card" data="projects" filter="group == 'function-evaluation'" %} {% include section.html %} + ## 面向应用的数据库性能评测 -{% include toollist.html component="toolcard" data="tools" filters="group: load-simulation" %} +{% include list.html component="card" data="projects" filter="group == 'load-simulation'" %} {% include section.html %} ## 面向新型数据库的Benchmark -{% include toollist.html component="toolcard" data="tools" filters="group: benchmark" %} +{% include list.html component="card" data="projects" filter="group == 'benchmark'" %} {% include section.html %} + ## 数据库测试平台 -{% include toollist.html component="toolcard" style="large" data="tools" filters="group: general" %} \ No newline at end of file +{% include list.html component="card" data="projects" filter="group == 'general'" %} + +{% include section.html %} + +## More + +{% include list.html component="card" data="projects" filter="!group" style="small" %} \ No newline at end of file diff --git a/research/index.md b/research/index.md index 64ed833..a777766 100644 --- a/research/index.md +++ b/research/index.md @@ -9,10 +9,10 @@ nav: -{% include section.html %} +## All {% include search-box.html %} {% include search-info.html %} -{% include list.html data="citations" component="citation" style="norich" %} +{% include list.html data="citations" component="citation" style="rich" %} diff --git a/team/index.md b/team/index.md index 280c501..fd84e14 100644 --- a/team/index.md +++ b/team/index.md @@ -11,53 +11,24 @@ nav: ## 教师 -{% - include member-list.html - data="members" - component="portrait" - style="small" 
- filters="role: professor" -%} +{% include list.html data="members" component="portrait" filter="role == 'professor'" %} + ## 博士研究生 -{% - include member-list.html - data="members" - component="portrait" - style="small" - filters="role: phd" -%} +{% include list.html data="members" component="portrait" filter="role == 'phd'" %} ## 硕士研究生 -{% - include member-list.html - data="members" - component="portrait" - style="small" - filters="role: post" -%} +{% include list.html data="members" component="portrait" filter="role == 'post'" %} ## 毕业博士生 -{% - include member-list.html - data="members" - component="portrait" - style="small" - filters="role: graduated_phd" -%} +{% include list.html data="members" component="portrait" filter="role == 'graduated_phd'" %} ## 毕业硕士生 -{% - include member-list.html - data="members" - component="portrait" - style="small" - filters="role: graduated_post" -%} +{% include list.html data="members" component="portrait" filter="role == 'graduated_post'" %} {% include section.html %} @@ -68,39 +39,3 @@ nav: {% include link.html type="email" link="rzhang@dase.ecnu.edu.cn" text="联系我们" icon="" style="button" %} {:.center} - - - -