View Javadoc

1   /*
2    *
3    * Licensed to the Apache Software Foundation (ASF) under one
4    * or more contributor license agreements.  See the NOTICE file
5    * distributed with this work for additional information
6    * regarding copyright ownership.  The ASF licenses this file
7    * to you under the Apache License, Version 2.0 (the
8    * "License"); you may not use this file except in compliance
9    * with the License.  You may obtain a copy of the License at
10   *
11   * http://www.apache.org/licenses/LICENSE-2.0
12   *
13   * Unless required by applicable law or agreed to in writing, software
14   * distributed under the License is distributed on an "AS IS" BASIS,
15   * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
16   * See the License for the specific language governing permissions and
17   * limitations under the License.
18   */
19  
20  package org.apache.hadoop.hbase.coprocessor;
21  
22  import java.io.IOException;
23  
24  import org.apache.hadoop.conf.Configuration;
25  import org.apache.hadoop.hbase.*;
26  import org.apache.hadoop.hbase.client.HTable;
27  import org.apache.hadoop.hbase.client.Put;
28  import org.apache.hadoop.hbase.client.RetriesExhaustedWithDetailsException;
29  import org.apache.hadoop.hbase.client.Durability;
30  import org.apache.hadoop.hbase.regionserver.HRegionServer;
31  import org.apache.hadoop.hbase.util.Bytes;
32  import org.apache.hadoop.hbase.regionserver.wal.WALEdit;
33  import org.junit.AfterClass;
34  import org.junit.BeforeClass;
35  import org.junit.Test;
36  import org.junit.experimental.categories.Category;
37  
38  import static org.junit.Assert.*;
39  
40  /**
41   * Tests unhandled exceptions thrown by coprocessors running on regionserver.
42   * Expected result is that the master will remove the buggy coprocessor from
43   * its set of coprocessors and throw a org.apache.hadoop.hbase.exceptions.DoNotRetryIOException
44   * back to the client.
45   * (HBASE-4014).
46   */
47  @Category(MediumTests.class)
48  public class TestRegionServerCoprocessorExceptionWithRemove {
49    public static class BuggyRegionObserver extends SimpleRegionObserver {
50      @SuppressWarnings("null")
51      @Override
52      public void prePut(final ObserverContext<RegionCoprocessorEnvironment> c,
53                         final Put put, final WALEdit edit,
54                         final Durability durability) {
55        String tableName =
56            c.getEnvironment().getRegion().getRegionInfo()
57                .getTableName().getNameAsString();
58        if (tableName.equals("observed_table")) {
59          Integer i = null;
60          i = i + 1;
61        }
62      }
63    }
64  
65    private static HBaseTestingUtility TEST_UTIL = new HBaseTestingUtility();
66  
67    @BeforeClass
68    public static void setupBeforeClass() throws Exception {
69      // set configure to indicate which cp should be loaded
70      Configuration conf = TEST_UTIL.getConfiguration();
71      conf.set(CoprocessorHost.REGION_COPROCESSOR_CONF_KEY,
72          BuggyRegionObserver.class.getName());
73      TEST_UTIL.startMiniCluster(2);
74    }
75  
76    @AfterClass
77    public static void teardownAfterClass() throws Exception {
78      TEST_UTIL.shutdownMiniCluster();
79    }
80  
81    @Test(timeout=60000)
82    public void testExceptionFromCoprocessorDuringPut()
83        throws IOException, InterruptedException {
84      // Set watches on the zookeeper nodes for all of the regionservers in the
85      // cluster. When we try to write to TEST_TABLE, the buggy coprocessor will
86      // cause a NullPointerException, which will cause the regionserver (which
87      // hosts the region we attempted to write to) to abort. In turn, this will
88      // cause the nodeDeleted() method of the DeadRegionServer tracker to
89      // execute, which will set the rsZKNodeDeleted flag to true, which will
90      // pass this test.
91  
92      TableName TEST_TABLE =
93          TableName.valueOf("observed_table");
94      byte[] TEST_FAMILY = Bytes.toBytes("aaa");
95  
96      HTable table = TEST_UTIL.createTable(TEST_TABLE, TEST_FAMILY);
97      TEST_UTIL.createMultiRegions(table, TEST_FAMILY);
98      TEST_UTIL.waitUntilAllRegionsAssigned(TEST_TABLE);
99      // Note which regionServer that should survive the buggy coprocessor's
100     // prePut().
101     HRegionServer regionServer =
102         TEST_UTIL.getRSForFirstRegionInTable(TEST_TABLE);
103 
104     // same logic as {@link TestMasterCoprocessorExceptionWithRemove},
105     // but exception will be RetriesExhaustedWithDetailException rather
106     // than DoNotRetryIOException. The latter exception is what the RegionServer
107     // will have actually thrown, but the client will wrap this in a
108     // RetriesExhaustedWithDetailException.
109     // We will verify that "DoNotRetryIOException" appears in the text of the
110     // the exception's detailMessage.
111     boolean threwDNRE = false;
112     try {
113       final byte[] ROW = Bytes.toBytes("aaa");
114       Put put = new Put(ROW);
115       put.add(TEST_FAMILY, ROW, ROW);
116       table.put(put);
117     } catch (RetriesExhaustedWithDetailsException e) {
118       // below, could call instead :
119       // startsWith("Failed 1 action: DoNotRetryIOException.")
120       // But that might be too brittle if client-side
121       // DoNotRetryIOException-handler changes its message.
122       assertTrue(e.getMessage().contains("DoNotRetryIOException"));
123       threwDNRE = true;
124     } finally {
125       assertTrue(threwDNRE);
126     }
127 
128     // Wait 3 seconds for the regionserver to abort: expected result is that
129     // it will survive and not abort.
130     for (int i = 0; i < 3; i++) {
131       assertFalse(regionServer.isAborted());
132       try {
133         Thread.sleep(1000);
134       } catch (InterruptedException e) {
135         fail("InterruptedException while waiting for regionserver " +
136             "zk node to be deleted.");
137       }
138     }
139     table.close();
140   }
141 
142 }
143