/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.hadoop.hbase.regionserver.querymatcher;

import static org.junit.Assert.assertArrayEquals;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;

import java.io.IOException;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
import org.apache.hadoop.hbase.Cell;
import org.apache.hadoop.hbase.ExtendedCell;
import org.apache.hadoop.hbase.HBaseClassTestRule;
import org.apache.hadoop.hbase.HConstants;
import org.apache.hadoop.hbase.KeepDeletedCells;
import org.apache.hadoop.hbase.KeyValue;
import org.apache.hadoop.hbase.PrivateCellUtil;
import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.filter.FilterBase;
import org.apache.hadoop.hbase.regionserver.ScanInfo;
import org.apache.hadoop.hbase.regionserver.querymatcher.ScanQueryMatcher.MatchCode;
import org.apache.hadoop.hbase.testclassification.RegionServerTests;
import org.apache.hadoop.hbase.testclassification.SmallTests;
import org.apache.hadoop.hbase.util.EnvironmentEdgeManager;
import org.junit.ClassRule;
import org.junit.Test;
import org.junit.experimental.categories.Category;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

/**
 * Tests the {@link MatchCode}s produced by {@link UserScanQueryMatcher} for explicit-column and
 * wildcard scans, for expired cells, and when the scan carries a filter. Fixture fields such as
 * {@code scan}, {@code get}, {@code conf}, {@code ttl}, the row/family/qualifier byte arrays and
 * {@code rowComparator} are inherited from {@link AbstractTestScanQueryMatcher}.
 */
@Category({ RegionServerTests.class, SmallTests.class })
public class TestUserScanQueryMatcher extends AbstractTestScanQueryMatcher {

  @ClassRule
  public static final HBaseClassTestRule CLASS_RULE =
    HBaseClassTestRule.forClass(TestUserScanQueryMatcher.class);

  private static final Logger LOG = LoggerFactory.getLogger(TestUserScanQueryMatcher.class);

  /**
   * Builds a {@link UserScanQueryMatcher} for {@code fam2} with the settings every test in this
   * class shares: {@link KeepDeletedCells#FALSE}, the default block size, and an
   * oldest-unexpired timestamp of {@code now - timeToLive}.
   * @param userScan        the scan handed to the matcher
   * @param minVersions     third {@link ScanInfo} constructor argument (min versions)
   * @param maxVersions     fourth {@link ScanInfo} constructor argument (max versions of the
   *                        family)
   * @param timeToLive      TTL given to the {@link ScanInfo} and used to derive the expiry cutoff
   * @param explicitColumns {@code true} to restrict the matcher to the qualifiers registered on
   *                        the inherited {@code get} for {@code fam2}; {@code false} to pass
   *                        {@code null} columns (wildcard)
   * @param now             the timestamp the matcher treats as the current time
   * @return the configured matcher
   * @throws IOException if the matcher cannot be created
   */
  private UserScanQueryMatcher createMatcher(Scan userScan, int minVersions, int maxVersions,
    long timeToLive, boolean explicitColumns, long now) throws IOException {
    ScanInfo scanInfo = new ScanInfo(this.conf, fam2, minVersions, maxVersions, timeToLive,
      KeepDeletedCells.FALSE, HConstants.DEFAULT_BLOCKSIZE, 0, rowComparator, false);
    return UserScanQueryMatcher.create(userScan, scanInfo,
      explicitColumns ? get.getFamilyMap().get(fam2) : null, now - timeToLive, now, null);
  }

  /**
   * Positions {@code qm} on the row of the first cell, feeds every cell to
   * {@link UserScanQueryMatcher#match} in order, and verifies the resulting codes against
   * {@code expected}. All cells are matched before anything is asserted, so the debug log shows
   * the complete expected/actual sequence up to the first mismatch.
   * @param qm       the matcher under test
   * @param expected the match code expected for each cell, in order
   * @param cells    the cells to match; must not be empty
   * @throws IOException if matching fails
   */
  private static void assertMatchCodes(UserScanQueryMatcher qm, List<MatchCode> expected,
    List<KeyValue> cells) throws IOException {
    // Guard the get(0) below so a broken fixture fails with a clear message.
    assertFalse("at least one cell is required to position the matcher", cells.isEmpty());
    qm.setToNewRow(cells.get(0));

    List<MatchCode> actual = new ArrayList<>(cells.size());
    for (KeyValue cell : cells) {
      actual.add(qm.match(cell));
    }

    assertEquals(expected.size(), actual.size());
    for (int i = 0; i < expected.size(); i++) {
      LOG.debug("expected {}, actual {}", expected.get(i), actual.get(i));
      assertEquals("match code for cell #" + i, expected.get(i), actual.get(i));
    }
  }

  /**
   * This is a cryptic test. It is checking that we don't include a fake cell. See HBASE-16074 for
   * background.
   */
  @Test
  public void testNeverIncludeFakeCell() throws IOException {
    long now = EnvironmentEdgeManager.currentTime();
    // Do with fam2 which has a col2 qualifier.
    UserScanQueryMatcher qm = createMatcher(scan, 10, 1, ttl, true, now);
    ExtendedCell kv = new KeyValue(row1, fam2, col2, 1, data);
    // The fake "last on row/col" cell must be seeked past, never included.
    ExtendedCell cell = PrivateCellUtil.createLastOnRowCol(kv);
    qm.setToNewRow(kv);
    assertEquals(MatchCode.SEEK_NEXT_COL, qm.match(cell));
  }

  /**
   * Verifies the match codes for a scan that names its columns explicitly (columns 2, 4 and 5).
   */
  @Test
  public void testMatchExplicitColumns() throws IOException {
    // Moving up from the Tracker by using Gets and List<KeyValue> instead
    // of just byte []
    List<MatchCode> expected = Arrays.asList(
      MatchCode.SEEK_NEXT_COL,
      MatchCode.INCLUDE_AND_SEEK_NEXT_COL,
      MatchCode.SEEK_NEXT_COL,
      MatchCode.INCLUDE_AND_SEEK_NEXT_COL,
      MatchCode.INCLUDE_AND_SEEK_NEXT_ROW,
      MatchCode.DONE);

    long now = EnvironmentEdgeManager.currentTime();
    // 2,4,5
    UserScanQueryMatcher qm = createMatcher(scan, 0, 1, ttl, true, now);

    List<KeyValue> memstore = Arrays.asList(
      new KeyValue(row1, fam2, col1, 1, data),
      new KeyValue(row1, fam2, col2, 1, data),
      new KeyValue(row1, fam2, col3, 1, data),
      new KeyValue(row1, fam2, col4, 1, data),
      new KeyValue(row1, fam2, col5, 1, data),
      new KeyValue(row2, fam1, col1, data));

    assertMatchCodes(qm, expected, memstore);
  }

  /**
   * Verifies the match codes for a scan with no explicit columns (wildcard).
   */
  @Test
  public void testMatch_Wildcard() throws IOException {
    // Moving up from the Tracker by using Gets and List<KeyValue> instead
    // of just byte []
    List<MatchCode> expected = Arrays.asList(
      MatchCode.INCLUDE,
      MatchCode.INCLUDE,
      MatchCode.INCLUDE,
      MatchCode.INCLUDE,
      MatchCode.INCLUDE,
      MatchCode.DONE);

    long now = EnvironmentEdgeManager.currentTime();
    UserScanQueryMatcher qm = createMatcher(scan, 0, 1, ttl, false, now);

    List<KeyValue> memstore = Arrays.asList(
      new KeyValue(row1, fam2, col1, 1, data),
      new KeyValue(row1, fam2, col2, 1, data),
      new KeyValue(row1, fam2, col3, 1, data),
      new KeyValue(row1, fam2, col4, 1, data),
      new KeyValue(row1, fam2, col5, 1, data),
      new KeyValue(row2, fam1, col1, 1, data));

    assertMatchCodes(qm, expected, memstore);
  }

  /**
   * Verify that {@link ScanQueryMatcher} only skips expired KeyValue instances and does not exit
   * early from the row (skipping later non-expired KeyValues). This version mimics a Get with
   * explicitly specified column qualifiers.
   */
  @Test
  public void testMatch_ExpiredExplicit() throws IOException {
    long testTTL = 1000;
    List<MatchCode> expected = Arrays.asList(
      MatchCode.SEEK_NEXT_COL,
      MatchCode.INCLUDE_AND_SEEK_NEXT_COL,
      MatchCode.SEEK_NEXT_COL,
      MatchCode.INCLUDE_AND_SEEK_NEXT_COL,
      MatchCode.SEEK_NEXT_ROW,
      MatchCode.DONE);

    long now = EnvironmentEdgeManager.currentTime();
    UserScanQueryMatcher qm = createMatcher(scan, 0, 1, testTTL, true, now);

    // col3 and col5 carry timestamps older than now - testTTL, i.e. they are expired.
    List<KeyValue> kvs = Arrays.asList(
      new KeyValue(row1, fam2, col1, now - 100, data),
      new KeyValue(row1, fam2, col2, now - 50, data),
      new KeyValue(row1, fam2, col3, now - 5000, data),
      new KeyValue(row1, fam2, col4, now - 500, data),
      new KeyValue(row1, fam2, col5, now - 10000, data),
      new KeyValue(row2, fam1, col1, now - 10, data));

    assertMatchCodes(qm, expected, kvs);
  }

  /**
   * Verify that {@link ScanQueryMatcher} only skips expired KeyValue instances and does not exit
   * early from the row (skipping later non-expired KeyValues). This version mimics a Get with
   * wildcard-inferred column qualifiers.
   */
  @Test
  public void testMatch_ExpiredWildcard() throws IOException {
    long testTTL = 1000;
    List<MatchCode> expected = Arrays.asList(
      MatchCode.INCLUDE,
      MatchCode.INCLUDE,
      MatchCode.SEEK_NEXT_COL,
      MatchCode.INCLUDE,
      MatchCode.SEEK_NEXT_COL,
      MatchCode.DONE);

    long now = EnvironmentEdgeManager.currentTime();
    UserScanQueryMatcher qm = createMatcher(scan, 0, 1, testTTL, false, now);

    // col3 and col5 carry timestamps older than now - testTTL, i.e. they are expired.
    List<KeyValue> kvs = Arrays.asList(
      new KeyValue(row1, fam2, col1, now - 100, data),
      new KeyValue(row1, fam2, col2, now - 50, data),
      new KeyValue(row1, fam2, col3, now - 5000, data),
      new KeyValue(row1, fam2, col4, now - 500, data),
      new KeyValue(row1, fam2, col5, now - 10000, data),
      new KeyValue(row2, fam1, col1, now - 10, data));

    assertMatchCodes(qm, expected, kvs);
  }

  /** Filter whose {@code filterCell} answers INCLUDE_AND_SEEK_NEXT_ROW for every cell. */
  private static class AlwaysIncludeAndSeekNextRowFilter extends FilterBase {
    @Override
    public ReturnCode filterCell(final Cell c) {
      return ReturnCode.INCLUDE_AND_SEEK_NEXT_ROW;
    }
  }

  /**
   * Verifies that when the filter answers INCLUDE_AND_SEEK_NEXT_ROW for a cell in an explicitly
   * requested column, the matcher's final code is INCLUDE_AND_SEEK_NEXT_ROW.
   */
  @Test
  public void testMatchWhenFilterReturnsIncludeAndSeekNextRow() throws IOException {
    List<MatchCode> expected = Arrays.asList(
      MatchCode.INCLUDE_AND_SEEK_NEXT_ROW,
      MatchCode.DONE);

    Scan scanWithFilter = new Scan(scan).setFilter(new AlwaysIncludeAndSeekNextRowFilter());

    long now = EnvironmentEdgeManager.currentTime();

    // scan with column 2,4,5
    UserScanQueryMatcher qm = createMatcher(scanWithFilter, 0, 1, ttl, true, now);

    // ColumnTracker will return INCLUDE_AND_SEEK_NEXT_COL , and filter will return
    // INCLUDE_AND_SEEK_NEXT_ROW, so final match code will be INCLUDE_AND_SEEK_NEXT_ROW.
    List<KeyValue> memstore = Arrays.asList(
      new KeyValue(row1, fam2, col2, 1, data),
      new KeyValue(row2, fam1, col1, data));

    assertMatchCodes(qm, expected, memstore);
  }

  /** Filter whose {@code filterCell} answers INCLUDE for every cell. */
  private static class AlwaysIncludeFilter extends FilterBase {
    @Override
    public ReturnCode filterCell(final Cell c) {
      return ReturnCode.INCLUDE;
    }
  }

  /**
   * Here is the unit test for UserScanQueryMatcher#mergeFilterResponse, when the number of cells
   * exceed the versions requested in scan, we should return SEEK_NEXT_COL, but if current match
   * code is INCLUDE_AND_SEEK_NEXT_ROW, we can optimize to choose the max step between SEEK_NEXT_COL
   * and INCLUDE_AND_SEEK_NEXT_ROW, which is SEEK_NEXT_ROW.
   */
  @Test
  public void testMergeFilterResponseCase1() throws IOException {
    Scan scanWithFilter = new Scan(scan).setFilter(new AlwaysIncludeFilter()).readVersions(2);

    long now = EnvironmentEdgeManager.currentTime();
    // scan with column 2,4,5, the family with maxVersion = 3
    UserScanQueryMatcher qm = createMatcher(scanWithFilter, 0, 3, ttl, true, now);

    List<KeyValue> memstore = Arrays.asList(
      new KeyValue(row1, fam1, col5, 1, data), // match code will be INCLUDE
      new KeyValue(row1, fam1, col5, 2, data), // match code will be INCLUDE
      // match code will be SEEK_NEXT_ROW , which is max(INCLUDE_AND_SEEK_NEXT_ROW, SEEK_NEXT_COL).
      new KeyValue(row1, fam1, col5, 3, data));

    assertMatchCodes(qm,
      Arrays.asList(MatchCode.INCLUDE, MatchCode.INCLUDE, MatchCode.SEEK_NEXT_ROW), memstore);

    scanWithFilter = new Scan(scan).setFilter(new AlwaysIncludeFilter()).readVersions(1);
    qm = createMatcher(scanWithFilter, 0, 2, ttl, true, now);

    List<KeyValue> memstore2 = Arrays.asList(
      new KeyValue(row2, fam1, col2, 1, data), // match code will be INCLUDE
      // match code will be SEEK_NEXT_COL, which is max(INCLUDE_AND_SEEK_NEXT_COL, SEEK_NEXT_COL).
      new KeyValue(row2, fam1, col2, 2, data));

    assertMatchCodes(qm, Arrays.asList(MatchCode.INCLUDE, MatchCode.SEEK_NEXT_COL), memstore2);
  }

  /**
   * Here is the unit test for UserScanQueryMatcher#mergeFilterResponse: the match code may be
   * changed to SEEK_NEXT_COL or INCLUDE_AND_SEEK_NEXT_COL after merging with filterResponse, even
   * if the passed match code is neither SEEK_NEXT_COL nor INCLUDE_AND_SEEK_NEXT_COL. In that case,
   * we need to make sure that the ColumnTracker has been switched to the next column.
   * <p>
   * An effective way to test this is to check the cell returned by getKeyForNextColumn(): as long
   * as the UserScanQueryMatcher returns SEEK_NEXT_COL or INCLUDE_AND_SEEK_NEXT_COL,
   * UserScanQueryMatcher#getKeyForNextColumn should return a cell whose column is larger than the
   * current cell's.
   */
  @Test
  public void testMergeFilterResponseCase2() throws Exception {
    List<MatchCode> expected = Arrays.asList(
      MatchCode.INCLUDE,
      MatchCode.INCLUDE,
      MatchCode.INCLUDE,
      MatchCode.SEEK_NEXT_COL);

    Scan scanWithFilter = new Scan(scan).setFilter(new AlwaysIncludeFilter()).readVersions(3);

    long now = EnvironmentEdgeManager.currentTime();

    // scan with column 2,4,5, the family with maxVersion = 5
    UserScanQueryMatcher qm = createMatcher(scanWithFilter, 0, 5, ttl, true, now);

    List<KeyValue> memstore = Arrays.asList(
      new KeyValue(row1, fam1, col2, 1, data), // match code will be INCLUDE
      new KeyValue(row1, fam1, col2, 2, data), // match code will be INCLUDE
      new KeyValue(row1, fam1, col2, 3, data), // match code will be INCLUDE
      new KeyValue(row1, fam1, col2, 4, data)); // match code will be SEEK_NEXT_COL

    assertMatchCodes(qm, expected, memstore);

    // For last cell, the query matcher will return SEEK_NEXT_COL, and the
    // ColumnTracker will skip to the next column, which is col4.
    ExtendedCell lastCell = memstore.get(memstore.size() - 1);
    Cell nextCell = qm.getKeyForNextColumn(lastCell);
    // JUnit order is (expected, actual) so a failure reports the arrays the right way round.
    assertArrayEquals(col4, nextCell.getQualifierArray());
  }
}