You are viewing a plain text version of this content. The canonical link for it is here.
Posted to dev@kylin.apache.org by 《秦殇》!健 <ye...@foxmail.com> on 2017/03/03 04:47:27 UTC
build kylin cube occur hbase error
Hi all. I get a lot of errors when I build a cube. My environment is Kylin 1.6 + CDH 5.7, and my CDH HBase runs as a cluster.
Hosts: kylin 1.6: xx.xx.xx.32, cdh1 (hbase): xx.xx.xx.32, cdh2 (hbase): xx.xx.xx.33, cdh3 (hbase): xx.xx.xx.34. The errors are as follows:
2017-03-02 22:41:48,066 ERROR [pool-8-thread-1] dao.ExecutableDao:148 : error get all Jobs:org.apache.hadoop.hbase.client.RetriesExhaustedException: Failed after attempts=6, exceptions:Thu Mar 02 22:41:48 GMT+08:00 2017, null, java.net.SocketTimeoutException: callTimeout=60000, callDuration=114431: row '/execute/' on table 'kylin_metadata' at region=kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309., hostname=hf1-cdh1,60020,1488424273046, seqNum=2
at org.apache.hadoop.hbase.client.RpcRetryingCallerWithReadReplicas.throwEnrichedException(RpcRetryingCallerWithReadReplicas.java:276) at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas.call(ScannerCallableWithReplicas.java:207) at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas.call(ScannerCallableWithReplicas.java:60) at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithoutRetries(RpcRetryingCaller.java:200) at org.apache.hadoop.hbase.client.ClientScanner.call(ClientScanner.java:320) at org.apache.hadoop.hbase.client.ClientScanner.nextScanner(ClientScanner.java:295) at org.apache.hadoop.hbase.client.ClientScanner.initializeScannerInConstruction(ClientScanner.java:160) at org.apache.hadoop.hbase.client.ClientScanner.<init>(ClientScanner.java:155) at org.apache.hadoop.hbase.client.HTable.getScanner(HTable.java:867) at org.apache.kylin.storage.hbase.HBaseResourceStore.visitFolder(HBaseResourceStore.java:137) at org.apache.kylin.storage.hbase.HBaseResourceStore.listResourcesImpl(HBaseResourceStore.java:107) at org.apache.kylin.common.persistence.ResourceStore.listResources(ResourceStore.java:121) at org.apache.kylin.job.dao.ExecutableDao.getJobIds(ExecutableDao.java:138) at org.apache.kylin.job.manager.ExecutableManager.getAllJobIds(ExecutableManager.java:207) at org.apache.kylin.job.impl.threadpool.DefaultScheduler$FetcherRunner.run(DefaultScheduler.java:85) at java.util.concurrent.Executors$RunnableAdapter.call(Executors.java:471) at java.util.concurrent.FutureTask.runAndReset(FutureTask.java:304) at java.util.concurrent.ScheduledThreadPoolExecutor$ScheduledFutureTask.access$301(ScheduledThreadPoolExecutor.java:178) at java.util.concurrent.ScheduledThreadPoolExecutor$ScheduledFutureTask.run(ScheduledThreadPoolExecutor.java:293) at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1145) at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:615) at java.lang.Thread.run(Thread.java:745)Caused 
by: java.net.SocketTimeoutException: callTimeout=60000, callDuration=114431: row '/execute/' on table 'kylin_metadata' at region=kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309., hostname=hf1-cdh1,60020,1488424273046, seqNum=2 at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithRetries(RpcRetryingCaller.java:159) at org.apache.hadoop.hbase.client.ResultBoundedCompletionService$QueueingFuture.run(ResultBoundedCompletionService.java:65) ... 3 moreCaused by: java.net.ConnectException: Connection refused at sun.nio.ch.SocketChannelImpl.checkConnect(Native Method) at sun.nio.ch.SocketChannelImpl.finishConnect(SocketChannelImpl.java:744) at org.apache.hadoop.net.SocketIOWithTimeout.connect(SocketIOWithTimeout.java:206) at org.apache.hadoop.net.NetUtils.connect(NetUtils.java:530) at org.apache.hadoop.net.NetUtils.connect(NetUtils.java:494) at org.apache.hadoop.hbase.ipc.RpcClientImpl$Connection.setupConnection(RpcClientImpl.java:416) at org.apache.hadoop.hbase.ipc.RpcClientImpl$Connection.setupIOstreams(RpcClientImpl.java:722) at org.apache.hadoop.hbase.ipc.RpcClientImpl$Connection.writeRequest(RpcClientImpl.java:906) at org.apache.hadoop.hbase.ipc.RpcClientImpl$Connection.tracedWriteRequest(RpcClientImpl.java:873) at org.apache.hadoop.hbase.ipc.RpcClientImpl.call(RpcClientImpl.java:1242) at org.apache.hadoop.hbase.ipc.AbstractRpcClient.callBlockingMethod(AbstractRpcClient.java:226) at org.apache.hadoop.hbase.ipc.AbstractRpcClient$BlockingRpcChannelImplementation.callBlockingMethod(AbstractRpcClient.java:331) at org.apache.hadoop.hbase.protobuf.generated.ClientProtos$ClientService$BlockingStub.scan(ClientProtos.java:34094) at org.apache.hadoop.hbase.client.ScannerCallable.openScanner(ScannerCallable.java:394) at org.apache.hadoop.hbase.client.ScannerCallable.call(ScannerCallable.java:203) at org.apache.hadoop.hbase.client.ScannerCallable.call(ScannerCallable.java:64) at 
org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithoutRetries(RpcRetryingCaller.java:200) at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$RetryingRPC.call(ScannerCallableWithReplicas.java:360) at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$RetryingRPC.call(ScannerCallableWithReplicas.java:334) at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithRetries(RpcRetryingCaller.java:126) ... 4 more
Then I found that one of my HBase regionservers had shut down; unfortunately, Kylin and that regionserver run on the same machine.
I restarted the regionserver, but then another error occurred:
Caused by: org.apache.hadoop.hbase.NotServingRegionException: org.apache.hadoop.hbase.NotServingRegionException: Region kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309. is not online on hf1-cdh1,60020,1488505545946 at org.apache.hadoop.hbase.regionserver.HRegionServer.getRegionByEncodedName(HRegionServer.java:2920) at org.apache.hadoop.hbase.regionserver.RSRpcServices.getRegion(RSRpcServices.java:1053) at org.apache.hadoop.hbase.regionserver.RSRpcServices.scan(RSRpcServices.java:2385) at org.apache.hadoop.hbase.protobuf.generated.ClientProtos$ClientService$2.callBlockingMethod(ClientProtos.java:33648) at org.apache.hadoop.hbase.ipc.RpcServer.call(RpcServer.java:2170) at org.apache.hadoop.hbase.ipc.CallRunner.run(CallRunner.java:109) at org.apache.hadoop.hbase.ipc.RpcExecutor.consumerLoop(RpcExecutor.java:133) at org.apache.hadoop.hbase.ipc.RpcExecutor$1.run(RpcExecutor.java:108) at java.lang.Thread.run(Thread.java:745)
at sun.reflect.NativeConstructorAccessorImpl.newInstance0(Native Method) at sun.reflect.NativeConstructorAccessorImpl.newInstance(NativeConstructorAccessorImpl.java:57) at sun.reflect.DelegatingConstructorAccessorImpl.newInstance(DelegatingConstructorAccessorImpl.java:45) at java.lang.reflect.Constructor.newInstance(Constructor.java:526) at org.apache.hadoop.ipc.RemoteException.instantiateException(RemoteException.java:106) at org.apache.hadoop.ipc.RemoteException.unwrapRemoteException(RemoteException.java:95) at org.apache.hadoop.hbase.protobuf.ProtobufUtil.getRemoteException(ProtobufUtil.java:327) at org.apache.hadoop.hbase.client.ScannerCallable.openScanner(ScannerCallable.java:402) at org.apache.hadoop.hbase.client.ScannerCallable.call(ScannerCallable.java:203) at org.apache.hadoop.hbase.client.ScannerCallable.call(ScannerCallable.java:64) at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithoutRetries(RpcRetryingCaller.java:200) at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$RetryingRPC.call(ScannerCallableWithReplicas.java:360) at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$RetryingRPC.call(ScannerCallableWithReplicas.java:334) at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithRetries(RpcRetryingCaller.java:126) ... 4 moreCaused by: org.apache.hadoop.hbase.ipc.RemoteWithExtrasException(org.apache.hadoop.hbase.NotServingRegionException): org.apache.hadoop.hbase.NotServingRegionException: Region kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309. 
is not online on hf1-cdh1,60020,1488505545946 at org.apache.hadoop.hbase.regionserver.HRegionServer.getRegionByEncodedName(HRegionServer.java:2920) at org.apache.hadoop.hbase.regionserver.RSRpcServices.getRegion(RSRpcServices.java:1053) at org.apache.hadoop.hbase.regionserver.RSRpcServices.scan(RSRpcServices.java:2385) at org.apache.hadoop.hbase.protobuf.generated.ClientProtos$ClientService$2.callBlockingMethod(ClientProtos.java:33648) at org.apache.hadoop.hbase.ipc.RpcServer.call(RpcServer.java:2170) at org.apache.hadoop.hbase.ipc.CallRunner.run(CallRunner.java:109) at org.apache.hadoop.hbase.ipc.RpcExecutor.consumerLoop(RpcExecutor.java:133) at org.apache.hadoop.hbase.ipc.RpcExecutor$1.run(RpcExecutor.java:108) at java.lang.Thread.run(Thread.java:745)
at org.apache.hadoop.hbase.ipc.RpcClientImpl.call(RpcClientImpl.java:1268) at org.apache.hadoop.hbase.ipc.AbstractRpcClient.callBlockingMethod(AbstractRpcClient.java:226) at org.apache.hadoop.hbase.ipc.AbstractRpcClient$BlockingRpcChannelImplementation.callBlockingMethod(AbstractRpcClient.java:331) at org.apache.hadoop.hbase.protobuf.generated.ClientProtos$ClientService$BlockingStub.scan(ClientProtos.java:34094) at org.apache.hadoop.hbase.client.ScannerCallable.openScanner(ScannerCallable.java:394) ... 10 more
Could you please help me? My Kylin service cannot be used!
回复: build kylin cube occur hbase error
Posted by 《秦殇》!健 <ye...@foxmail.com>.
Thanks, I will check my logs carefully. :)
------------------ 原始邮件 ------------------
发件人: "RuiFeng Shan";<sh...@gmail.com>;
发送时间: 2017年3月3日(星期五) 下午5:58
收件人: "dev"<de...@kylin.apache.org>;
主题: Re: build kylin cube occur hbase error
Caused by: org.apache.hadoop.hbase.NotServingRegionException:
org.apache.hadoop.hbase.NotServingRegionException: Region
kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309. is not
online on hf1-cdh1,60020,1488505545946
I think that it is because your HBase regionserver failed to restart.
First, check the HBase web UI to make sure that all HBase
services (master and regionservers) are working properly.
Second, look for error information in the HBase log files.
If the HBase services are working well, you can then restart your Kylin service.
2017-03-03 12:47 GMT+08:00 《秦殇》!健 <ye...@foxmail.com>:
> Hi, All. I build cube occur a lot of error. my env is kylin1.6+cdh5.7, my
> cdh hbase is cluster.
> kylin 1.6 xx.xx.xx.32cdh1(hbase) xx.xx.xx.32 cdh2(hbase)
> xx.xx.xx.33cdh3(hbase) xx.xx.xx.34as follows:
>
> 2017-03-02 22:41:48,066 ERROR [pool-8-thread-1] dao.ExecutableDao:148 :
> error get all Jobs:org.apache.hadoop.hbase.client.RetriesExhaustedException:
> Failed after attempts=6, exceptions:Thu Mar 02 22:41:48 GMT+08:00 2017,
> null, java.net.SocketTimeoutException: callTimeout=60000,
> callDuration=114431: row '/execute/' on table 'kylin_metadata' at
> region=kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309.,
> hostname=hf1-cdh1,60020,1488424273046, seqNum=2
> at org.apache.hadoop.hbase.client.RpcRetryingCallerWithReadRepli
> cas.throwEnrichedException(RpcRetryingCallerWithReadReplicas.java:276)
> at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas.call(
> ScannerCallableWithReplicas.java:207) at org.apache.hadoop.hbase.
> client.ScannerCallableWithReplicas.call(ScannerCallableWithReplicas.java:60)
> at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithoutRetries(RpcRetryingCaller.java:200)
> at org.apache.hadoop.hbase.client.ClientScanner.call(ClientScanner.java:320)
> at org.apache.hadoop.hbase.client.ClientScanner.
> nextScanner(ClientScanner.java:295) at org.apache.hadoop.hbase.
> client.ClientScanner.initializeScannerInConstruction(ClientScanner.java:160)
> at org.apache.hadoop.hbase.client.ClientScanner.<init>(ClientScanner.java:155)
> at org.apache.hadoop.hbase.client.HTable.getScanner(HTable.java:867)
> at org.apache.kylin.storage.hbase.HBaseResourceStore.visitFolder(HBaseResourceStore.java:137)
> at org.apache.kylin.storage.hbase.HBaseResourceStore.listResourcesImpl(HBaseResourceStore.java:107)
> at org.apache.kylin.common.persistence.ResourceStore.
> listResources(ResourceStore.java:121) at org.apache.kylin.job.dao.
> ExecutableDao.getJobIds(ExecutableDao.java:138) at
> org.apache.kylin.job.manager.ExecutableManager.getAllJobIds(ExecutableManager.java:207)
> at org.apache.kylin.job.impl.threadpool.DefaultScheduler$
> FetcherRunner.run(DefaultScheduler.java:85) at java.util.concurrent.
> Executors$RunnableAdapter.call(Executors.java:471) at
> java.util.concurrent.FutureTask.runAndReset(FutureTask.java:304) at
> java.util.concurrent.ScheduledThreadPoolExecutor$
> ScheduledFutureTask.access$301(ScheduledThreadPoolExecutor.java:178)
> at java.util.concurrent.ScheduledThreadPoolExecutor$
> ScheduledFutureTask.run(ScheduledThreadPoolExecutor.java:293) at
> java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1145)
> at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:615)
> at java.lang.Thread.run(Thread.java:745)Caused by: java.net.SocketTimeoutException:
> callTimeout=60000, callDuration=114431: row '/execute/' on table
> 'kylin_metadata' at region=kylin_metadata,,1488427068259.
> 599efd68884035a133f306657bafb309., hostname=hf1-cdh1,60020,1488424273046,
> seqNum=2 at org.apache.hadoop.hbase.client.RpcRetryingCaller.
> callWithRetries(RpcRetryingCaller.java:159) at org.apache.hadoop.hbase.
> client.ResultBoundedCompletionService$QueueingFuture.run(
> ResultBoundedCompletionService.java:65) ... 3 moreCaused by:
> java.net.ConnectException: Connection refused at
> sun.nio.ch.SocketChannelImpl.checkConnect(Native Method) at
> sun.nio.ch.SocketChannelImpl.finishConnect(SocketChannelImpl.java:744)
> at org.apache.hadoop.net.SocketIOWithTimeout.connect(SocketIOWithTimeout.java:206)
> at org.apache.hadoop.net.NetUtils.connect(NetUtils.java:530) at
> org.apache.hadoop.net.NetUtils.connect(NetUtils.java:494) at
> org.apache.hadoop.hbase.ipc.RpcClientImpl$Connection.
> setupConnection(RpcClientImpl.java:416) at org.apache.hadoop.hbase.ipc.
> RpcClientImpl$Connection.setupIOstreams(RpcClientImpl.java:722) at
> org.apache.hadoop.hbase.ipc.RpcClientImpl$Connection.
> writeRequest(RpcClientImpl.java:906) at org.apache.hadoop.hbase.ipc.
> RpcClientImpl$Connection.tracedWriteRequest(RpcClientImpl.java:873)
> at org.apache.hadoop.hbase.ipc.RpcClientImpl.call(RpcClientImpl.java:1242)
> at org.apache.hadoop.hbase.ipc.AbstractRpcClient.callBlockingMethod(AbstractRpcClient.java:226)
> at org.apache.hadoop.hbase.ipc.AbstractRpcClient$
> BlockingRpcChannelImplementation.callBlockingMethod(AbstractRpcClient.java:331)
> at org.apache.hadoop.hbase.protobuf.generated.
> ClientProtos$ClientService$BlockingStub.scan(ClientProtos.java:34094)
> at org.apache.hadoop.hbase.client.ScannerCallable.
> openScanner(ScannerCallable.java:394) at org.apache.hadoop.hbase.
> client.ScannerCallable.call(ScannerCallable.java:203) at
> org.apache.hadoop.hbase.client.ScannerCallable.call(ScannerCallable.java:64)
> at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithoutRetries(RpcRetryingCaller.java:200)
> at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$
> RetryingRPC.call(ScannerCallableWithReplicas.java:360) at
> org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$
> RetryingRPC.call(ScannerCallableWithReplicas.java:334) at
> org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithRetries(RpcRetryingCaller.java:126)
> ... 4 more
>
> Then I found one of my hbase regionserver is shutdown, bad is kylin and
> hbase regionserver in common machine.
>
>
> I restart my regionserver. one other error occur:
> Caused by: org.apache.hadoop.hbase.NotServingRegionException:
> org.apache.hadoop.hbase.NotServingRegionException: Region
> kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309. is not
> online on hf1-cdh1,60020,1488505545946 at org.apache.hadoop.hbase.
> regionserver.HRegionServer.getRegionByEncodedName(HRegionServer.java:2920)
> at org.apache.hadoop.hbase.regionserver.RSRpcServices.
> getRegion(RSRpcServices.java:1053) at org.apache.hadoop.hbase.
> regionserver.RSRpcServices.scan(RSRpcServices.java:2385) at
> org.apache.hadoop.hbase.protobuf.generated.ClientProtos$ClientService$2.
> callBlockingMethod(ClientProtos.java:33648) at
> org.apache.hadoop.hbase.ipc.RpcServer.call(RpcServer.java:2170) at
> org.apache.hadoop.hbase.ipc.CallRunner.run(CallRunner.java:109) at
> org.apache.hadoop.hbase.ipc.RpcExecutor.consumerLoop(RpcExecutor.java:133)
> at org.apache.hadoop.hbase.ipc.RpcExecutor$1.run(RpcExecutor.java:108)
> at java.lang.Thread.run(Thread.java:745)
> at sun.reflect.NativeConstructorAccessorImpl.newInstance0(Native
> Method) at sun.reflect.NativeConstructorAccessorImpl.newInstance(
> NativeConstructorAccessorImpl.java:57) at sun.reflect.
> DelegatingConstructorAccessorImpl.newInstance(
> DelegatingConstructorAccessorImpl.java:45) at
> java.lang.reflect.Constructor.newInstance(Constructor.java:526) at
> org.apache.hadoop.ipc.RemoteException.instantiateException(RemoteException.java:106)
> at org.apache.hadoop.ipc.RemoteException.unwrapRemoteException(RemoteException.java:95)
> at org.apache.hadoop.hbase.protobuf.ProtobufUtil.getRemoteException(ProtobufUtil.java:327)
> at org.apache.hadoop.hbase.client.ScannerCallable.
> openScanner(ScannerCallable.java:402) at org.apache.hadoop.hbase.
> client.ScannerCallable.call(ScannerCallable.java:203) at
> org.apache.hadoop.hbase.client.ScannerCallable.call(ScannerCallable.java:64)
> at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithoutRetries(RpcRetryingCaller.java:200)
> at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$
> RetryingRPC.call(ScannerCallableWithReplicas.java:360) at
> org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$
> RetryingRPC.call(ScannerCallableWithReplicas.java:334) at
> org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithRetries(RpcRetryingCaller.java:126)
> ... 4 moreCaused by: org.apache.hadoop.hbase.ipc.
> RemoteWithExtrasException(org.apache.hadoop.hbase.NotServingRegionException):
> org.apache.hadoop.hbase.NotServingRegionException: Region
> kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309. is not
> online on hf1-cdh1,60020,1488505545946 at org.apache.hadoop.hbase.
> regionserver.HRegionServer.getRegionByEncodedName(HRegionServer.java:2920)
> at org.apache.hadoop.hbase.regionserver.RSRpcServices.
> getRegion(RSRpcServices.java:1053) at org.apache.hadoop.hbase.
> regionserver.RSRpcServices.scan(RSRpcServices.java:2385) at
> org.apache.hadoop.hbase.protobuf.generated.ClientProtos$ClientService$2.
> callBlockingMethod(ClientProtos.java:33648) at
> org.apache.hadoop.hbase.ipc.RpcServer.call(RpcServer.java:2170) at
> org.apache.hadoop.hbase.ipc.CallRunner.run(CallRunner.java:109) at
> org.apache.hadoop.hbase.ipc.RpcExecutor.consumerLoop(RpcExecutor.java:133)
> at org.apache.hadoop.hbase.ipc.RpcExecutor$1.run(RpcExecutor.java:108)
> at java.lang.Thread.run(Thread.java:745)
> at org.apache.hadoop.hbase.ipc.RpcClientImpl.call(RpcClientImpl.java:1268)
> at org.apache.hadoop.hbase.ipc.AbstractRpcClient.callBlockingMethod(AbstractRpcClient.java:226)
> at org.apache.hadoop.hbase.ipc.AbstractRpcClient$
> BlockingRpcChannelImplementation.callBlockingMethod(AbstractRpcClient.java:331)
> at org.apache.hadoop.hbase.protobuf.generated.
> ClientProtos$ClientService$BlockingStub.scan(ClientProtos.java:34094)
> at org.apache.hadoop.hbase.client.ScannerCallable.
> openScanner(ScannerCallable.java:394) ... 10 more
> Could you give me a help, my kylin service can not to use!!!!
--
Re: build kylin cube occur hbase error
Posted by RuiFeng Shan <sh...@gmail.com>.
Caused by: org.apache.hadoop.hbase.NotServingRegionException:
org.apache.hadoop.hbase.NotServingRegionException: Region
kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309. is not
online on hf1-cdh1,60020,1488505545946
I think that it is because your HBase regionserver failed to restart.
First, check the HBase web UI to make sure that all HBase
services (master and regionservers) are working properly.
Second, look for error information in the HBase log files.
If the HBase services are working well, you can then restart your Kylin service.
2017-03-03 12:47 GMT+08:00 《秦殇》!健 <ye...@foxmail.com>:
> Hi, All. I build cube occur a lot of error. my env is kylin1.6+cdh5.7, my
> cdh hbase is cluster.
> kylin 1.6 xx.xx.xx.32cdh1(hbase) xx.xx.xx.32 cdh2(hbase)
> xx.xx.xx.33cdh3(hbase) xx.xx.xx.34as follows:
>
> 2017-03-02 22:41:48,066 ERROR [pool-8-thread-1] dao.ExecutableDao:148 :
> error get all Jobs:org.apache.hadoop.hbase.client.RetriesExhaustedException:
> Failed after attempts=6, exceptions:Thu Mar 02 22:41:48 GMT+08:00 2017,
> null, java.net.SocketTimeoutException: callTimeout=60000,
> callDuration=114431: row '/execute/' on table 'kylin_metadata' at
> region=kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309.,
> hostname=hf1-cdh1,60020,1488424273046, seqNum=2
> at org.apache.hadoop.hbase.client.RpcRetryingCallerWithReadRepli
> cas.throwEnrichedException(RpcRetryingCallerWithReadReplicas.java:276)
> at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas.call(
> ScannerCallableWithReplicas.java:207) at org.apache.hadoop.hbase.
> client.ScannerCallableWithReplicas.call(ScannerCallableWithReplicas.java:60)
> at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithoutRetries(RpcRetryingCaller.java:200)
> at org.apache.hadoop.hbase.client.ClientScanner.call(ClientScanner.java:320)
> at org.apache.hadoop.hbase.client.ClientScanner.
> nextScanner(ClientScanner.java:295) at org.apache.hadoop.hbase.
> client.ClientScanner.initializeScannerInConstruction(ClientScanner.java:160)
> at org.apache.hadoop.hbase.client.ClientScanner.<init>(ClientScanner.java:155)
> at org.apache.hadoop.hbase.client.HTable.getScanner(HTable.java:867)
> at org.apache.kylin.storage.hbase.HBaseResourceStore.visitFolder(HBaseResourceStore.java:137)
> at org.apache.kylin.storage.hbase.HBaseResourceStore.listResourcesImpl(HBaseResourceStore.java:107)
> at org.apache.kylin.common.persistence.ResourceStore.
> listResources(ResourceStore.java:121) at org.apache.kylin.job.dao.
> ExecutableDao.getJobIds(ExecutableDao.java:138) at
> org.apache.kylin.job.manager.ExecutableManager.getAllJobIds(ExecutableManager.java:207)
> at org.apache.kylin.job.impl.threadpool.DefaultScheduler$
> FetcherRunner.run(DefaultScheduler.java:85) at java.util.concurrent.
> Executors$RunnableAdapter.call(Executors.java:471) at
> java.util.concurrent.FutureTask.runAndReset(FutureTask.java:304) at
> java.util.concurrent.ScheduledThreadPoolExecutor$
> ScheduledFutureTask.access$301(ScheduledThreadPoolExecutor.java:178)
> at java.util.concurrent.ScheduledThreadPoolExecutor$
> ScheduledFutureTask.run(ScheduledThreadPoolExecutor.java:293) at
> java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1145)
> at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:615)
> at java.lang.Thread.run(Thread.java:745)Caused by: java.net.SocketTimeoutException:
> callTimeout=60000, callDuration=114431: row '/execute/' on table
> 'kylin_metadata' at region=kylin_metadata,,1488427068259.
> 599efd68884035a133f306657bafb309., hostname=hf1-cdh1,60020,1488424273046,
> seqNum=2 at org.apache.hadoop.hbase.client.RpcRetryingCaller.
> callWithRetries(RpcRetryingCaller.java:159) at org.apache.hadoop.hbase.
> client.ResultBoundedCompletionService$QueueingFuture.run(
> ResultBoundedCompletionService.java:65) ... 3 moreCaused by:
> java.net.ConnectException: Connection refused at
> sun.nio.ch.SocketChannelImpl.checkConnect(Native Method) at
> sun.nio.ch.SocketChannelImpl.finishConnect(SocketChannelImpl.java:744)
> at org.apache.hadoop.net.SocketIOWithTimeout.connect(SocketIOWithTimeout.java:206)
> at org.apache.hadoop.net.NetUtils.connect(NetUtils.java:530) at
> org.apache.hadoop.net.NetUtils.connect(NetUtils.java:494) at
> org.apache.hadoop.hbase.ipc.RpcClientImpl$Connection.
> setupConnection(RpcClientImpl.java:416) at org.apache.hadoop.hbase.ipc.
> RpcClientImpl$Connection.setupIOstreams(RpcClientImpl.java:722) at
> org.apache.hadoop.hbase.ipc.RpcClientImpl$Connection.
> writeRequest(RpcClientImpl.java:906) at org.apache.hadoop.hbase.ipc.
> RpcClientImpl$Connection.tracedWriteRequest(RpcClientImpl.java:873)
> at org.apache.hadoop.hbase.ipc.RpcClientImpl.call(RpcClientImpl.java:1242)
> at org.apache.hadoop.hbase.ipc.AbstractRpcClient.callBlockingMethod(AbstractRpcClient.java:226)
> at org.apache.hadoop.hbase.ipc.AbstractRpcClient$
> BlockingRpcChannelImplementation.callBlockingMethod(AbstractRpcClient.java:331)
> at org.apache.hadoop.hbase.protobuf.generated.
> ClientProtos$ClientService$BlockingStub.scan(ClientProtos.java:34094)
> at org.apache.hadoop.hbase.client.ScannerCallable.
> openScanner(ScannerCallable.java:394) at org.apache.hadoop.hbase.
> client.ScannerCallable.call(ScannerCallable.java:203) at
> org.apache.hadoop.hbase.client.ScannerCallable.call(ScannerCallable.java:64)
> at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithoutRetries(RpcRetryingCaller.java:200)
> at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$
> RetryingRPC.call(ScannerCallableWithReplicas.java:360) at
> org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$
> RetryingRPC.call(ScannerCallableWithReplicas.java:334) at
> org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithRetries(RpcRetryingCaller.java:126)
> ... 4 more
>
> Then I found one of my hbase regionserver is shutdown, bad is kylin and
> hbase regionserver in common machine.
>
>
> I restart my regionserver. one other error occur:
> Caused by: org.apache.hadoop.hbase.NotServingRegionException:
> org.apache.hadoop.hbase.NotServingRegionException: Region
> kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309. is not
> online on hf1-cdh1,60020,1488505545946 at org.apache.hadoop.hbase.
> regionserver.HRegionServer.getRegionByEncodedName(HRegionServer.java:2920)
> at org.apache.hadoop.hbase.regionserver.RSRpcServices.
> getRegion(RSRpcServices.java:1053) at org.apache.hadoop.hbase.
> regionserver.RSRpcServices.scan(RSRpcServices.java:2385) at
> org.apache.hadoop.hbase.protobuf.generated.ClientProtos$ClientService$2.
> callBlockingMethod(ClientProtos.java:33648) at
> org.apache.hadoop.hbase.ipc.RpcServer.call(RpcServer.java:2170) at
> org.apache.hadoop.hbase.ipc.CallRunner.run(CallRunner.java:109) at
> org.apache.hadoop.hbase.ipc.RpcExecutor.consumerLoop(RpcExecutor.java:133)
> at org.apache.hadoop.hbase.ipc.RpcExecutor$1.run(RpcExecutor.java:108)
> at java.lang.Thread.run(Thread.java:745)
> at sun.reflect.NativeConstructorAccessorImpl.newInstance0(Native
> Method) at sun.reflect.NativeConstructorAccessorImpl.newInstance(
> NativeConstructorAccessorImpl.java:57) at sun.reflect.
> DelegatingConstructorAccessorImpl.newInstance(
> DelegatingConstructorAccessorImpl.java:45) at
> java.lang.reflect.Constructor.newInstance(Constructor.java:526) at
> org.apache.hadoop.ipc.RemoteException.instantiateException(RemoteException.java:106)
> at org.apache.hadoop.ipc.RemoteException.unwrapRemoteException(RemoteException.java:95)
> at org.apache.hadoop.hbase.protobuf.ProtobufUtil.getRemoteException(ProtobufUtil.java:327)
> at org.apache.hadoop.hbase.client.ScannerCallable.
> openScanner(ScannerCallable.java:402) at org.apache.hadoop.hbase.
> client.ScannerCallable.call(ScannerCallable.java:203) at
> org.apache.hadoop.hbase.client.ScannerCallable.call(ScannerCallable.java:64)
> at org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithoutRetries(RpcRetryingCaller.java:200)
> at org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$
> RetryingRPC.call(ScannerCallableWithReplicas.java:360) at
> org.apache.hadoop.hbase.client.ScannerCallableWithReplicas$
> RetryingRPC.call(ScannerCallableWithReplicas.java:334) at
> org.apache.hadoop.hbase.client.RpcRetryingCaller.callWithRetries(RpcRetryingCaller.java:126)
> ... 4 moreCaused by: org.apache.hadoop.hbase.ipc.
> RemoteWithExtrasException(org.apache.hadoop.hbase.NotServingRegionException):
> org.apache.hadoop.hbase.NotServingRegionException: Region
> kylin_metadata,,1488427068259.599efd68884035a133f306657bafb309. is not
> online on hf1-cdh1,60020,1488505545946 at org.apache.hadoop.hbase.
> regionserver.HRegionServer.getRegionByEncodedName(HRegionServer.java:2920)
> at org.apache.hadoop.hbase.regionserver.RSRpcServices.
> getRegion(RSRpcServices.java:1053) at org.apache.hadoop.hbase.
> regionserver.RSRpcServices.scan(RSRpcServices.java:2385) at
> org.apache.hadoop.hbase.protobuf.generated.ClientProtos$ClientService$2.
> callBlockingMethod(ClientProtos.java:33648) at
> org.apache.hadoop.hbase.ipc.RpcServer.call(RpcServer.java:2170) at
> org.apache.hadoop.hbase.ipc.CallRunner.run(CallRunner.java:109) at
> org.apache.hadoop.hbase.ipc.RpcExecutor.consumerLoop(RpcExecutor.java:133)
> at org.apache.hadoop.hbase.ipc.RpcExecutor$1.run(RpcExecutor.java:108)
> at java.lang.Thread.run(Thread.java:745)
> at org.apache.hadoop.hbase.ipc.RpcClientImpl.call(RpcClientImpl.java:1268)
> at org.apache.hadoop.hbase.ipc.AbstractRpcClient.callBlockingMethod(AbstractRpcClient.java:226)
> at org.apache.hadoop.hbase.ipc.AbstractRpcClient$
> BlockingRpcChannelImplementation.callBlockingMethod(AbstractRpcClient.java:331)
> at org.apache.hadoop.hbase.protobuf.generated.
> ClientProtos$ClientService$BlockingStub.scan(ClientProtos.java:34094)
> at org.apache.hadoop.hbase.client.ScannerCallable.
> openScanner(ScannerCallable.java:394) ... 10 more
> Could you give me a help, my kylin service can not to use!!!!
--