[ https://issues.apache.org/jira/browse/HAWQ-842?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=15341375#comment-15341375 ]
Lin Wen commented on HAWQ-842: ------------------------------ This failure occurs because the YARN Fair Scheduler is not supported yet, so I am closing this issue. A new JIRA will be created to add support for the Fair Scheduler. Thanks! > Failed to acquire resource from resource manager > ------------------------------------------------ > > Key: HAWQ-842 > URL: https://issues.apache.org/jira/browse/HAWQ-842 > Project: Apache HAWQ > Issue Type: Bug > Components: Resource Manager > Reporter: Bill Wailliam > Assignee: Lei Chang > > This is the pg_log: > 2016-06-20 17:56:03.864644 > CST,,,p526096,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","database system > was shut down at 2016-06-20 17:54:32 CST",,,,,,,0,,"xlog.c",6205, > 2016-06-20 17:56:03.864908 > CST,,,p526096,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","checkpoint > record is at 0/2672EF8",,,,,,,0,,"xlog.c",6304, > 2016-06-20 17:56:03.864923 > CST,,,p526096,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","redo record is > at 0/2672EF8; undo record is at 0/0; shutdown TRUE",,,,,,,0,,"xlog.c",6338, > 2016-06-20 17:56:03.864933 > CST,,,p526096,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","next > transaction ID: 0/1284; next OID: 16514",,,,,,,0,,"xlog.c",6342, > 2016-06-20 17:56:03.864942 > CST,,,p526096,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","next > MultiXactId: 1; next MultiXactOffset: 0",,,,,,,0,,"xlog.c",6345, > 2016-06-20 17:56:03.864951 > CST,,,p526096,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","end of > transaction log location is 0/2672F48",,,,,,,0,,"xlog.c",6582, > 2016-06-20 17:56:03.865750 > CST,,,p526096,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","Oldest active > transaction from prepared transactions 1284",,,,,,,0,,"xlog.c",5996, > 2016-06-20 17:56:03.867372 > CST,,,p526096,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","database system > is ready",,,,,,,0,,"xlog.c",6022, > 2016-06-20 17:56:03.867394 > CST,,,p526096,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","PostgreSQL > 8.2.15 (Greenplum Database 4.2.0 
build 1) (HAWQ 2.0.0.0 build dev) on > x86_64-unknown-linux-gnu, compiled by GCC gcc (GCC) 4.8.0 compiled on Jun 19 > 2016 03:02:01",,,,,,,0,,"xlog.c",6032, > 2016-06-20 17:56:03.868503 > CST,,,p526096,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","Finished normal > startup for clean shutdown case",,,,,,,0,,"xlog.c",6810, > 2016-06-20 17:56:03.876213 > CST,,,p526097,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","Finished > startup integrity checking",,,,,,,0,,"xlog.c",7159, > 2016-06-20 17:56:03.879998 > CST,,,p526104,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","HAWQ Segment RM > :: Temporary directory /data1/hawq/tmp",,,,,,,0,,"resourcemanager.c",1055, > 2016-06-20 17:56:03.880039 > CST,,,p526104,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","checkAndBuildFailedTmpDirList > finished checking temporary directory, which costs 41 > us",,,,,,,0,,"resourcemanager_RMSEG.c",274, > 2016-06-20 17:56:03.883958 > CST,,,p526104,th503294176,,,,0,con4,,seg-10000,,,,,"LOG","00000","YARN mode > resource broker created resource broker process > PID=526105.",,,,,,,0,,"resourcebroker_LIBYARN.c",158, > 2016-06-20 17:56:03.884155 > CST,,,p526105,th503294176,,,,0,con4,,seg-10000,,,,,"LOG","00000","YARN mode > resource broker accepted YARN connection arguments : YARN Server > RM_IP_XXXXXX:8032 Scheduler server RM_IP_XXXXXX:8030 Queue hawq Application > name hawq, by user:postgres",,,,,,,0,,"resourcebroker_LIBYARN_proc.c",501, > 2016-06-20 17:56:03.884283 > CST,,,p526104,th503294176,,,,0,con4,,seg-10000,,,,,"LOG","00000","Resource > manager starts accepting resource request. Listening normal socket port 5437. 
> Total listened 1 FDs.",,,,,,,0,,"resourcemanager.c",2492, > 2016-06-20 17:56:03.884378 > CST,,,p526094,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","Wait for HAWQ > RM -1",,,,,,,0,,"resourcemanager.c",421, > 2016-06-20 17:56:03.884409 > CST,,,p526094,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","HAWQ :: > Received signal notification that HAWQ RM works > now.",,,,,,,0,,"resourcemanager.c",429, > 2016-06-20 17:56:03.884424 > CST,,,p526094,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","PostgreSQL > 8.2.15 (Greenplum Database 4.2.0 build 1) (HAWQ 2.0.0.0 build dev) on > x86_64-unknown-linux-gnu, compiled by GCC gcc (GCC) 4.8.0 compiled on Jun 19 > 2016 03:02:03",,,,,,,0,,"postmaster.c",3694, > 2016-06-20 17:56:03.884441 > CST,,,p526094,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","database system > is ready to accept connections","PostgreSQL 8.2.15 (Greenplum Database 4.2.0 > build 1) (HAWQ 2.0.0.0 build dev) on x86_64-unknown-linux-gnu, compiled by > GCC gcc (GCC) 4.8.0 compiled on Jun 19 2016 > 03:02:03",,,,,,0,,"postmaster.c",3701, > 2016-06-20 17:56:03.885673 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.885486, p526105, th140510358382816, INFO > ApplicationClient session auth method : > simple",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.892215 > CST,,,p526104,th503294176,,,,0,con4,,seg-10000,,,,,"LOG","00000","Cleanup > segment configuration catalog table > successfully!",,,,,,,0,,"resourcepool.c",460, > 2016-06-20 17:56:03.892604 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.892561, p526105, th140510358382816, INFO Yarn RM HA is > not configured.",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.892643 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.892600, p526105, th140510358382816, INFO > ApplicationClient Resource Manager HA is > 
disable.",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.893081 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.893051, p526105, th140510358382816, INFO > ApplicationClient::getActiveAppClientProto is > called.",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.893116 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.893068, p526105, th140510358382816, INFO > ApplicationClient::getActiveAppClientProto, current is > 0.",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.895989 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.895940, p526105, th140510358382816, INFO > LibYarnClient::createJob, getNewApplication finished, > appId:[clusterTimeStamp:1466415720399,id:2]",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.896107 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.896075, p526105, th140510358382816, INFO > ApplicationClient::getActiveAppClientProto is > called.",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.896151 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.896094, p526105, th140510358382816, INFO > ApplicationClient::getActiveAppClientProto, current is > 0.",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.896602 > CST,,,p526104,th503294176,,,,0,con4,,seg-10000,,,,,"LOG","00000","Cleanup > segment configuration history catalog table successfully, keep period: recent > 365 days.",,,,,,,0,,"resourcepool.c",530, > 2016-06-20 17:56:03.897807 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.897769, p526105, th140510358382816, INFO > LibYarnClient::createJob, submitApplication > 
finished",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.897862 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.897833, p526105, th140510358382816, INFO > ApplicationClient::getActiveAppClientProto is > called.",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.897898 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.897851, p526105, th140510358382816, INFO > ApplicationClient::getActiveAppClientProto, current is > 0.",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.901293 > CST,,,p526104,th503294176,,,,0,con4,,seg-10000,,,,,"LOG","00000","Add a new > row into segment configuration catalog table,registration order:0, role:m, > status:u, port:5432, hostname:Master_ip, address:Master_ip, > description:",,,,,,,0,,"resourcepool.c",879, > 2016-06-20 17:56:03.901503 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.901443, p526105, th140510358382816, INFO > LibYarnClient::createJob, appId[cluster_timestamp:1466415720399,id:2], > appState:4",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.901535 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > 2016-06-20 17:56:03.901492, p526105, th140510358382816, INFO > ApplicationClient::getActiveAppClientProto is called. 
> 2016-06-20 17:56:03.901502, p526105, th140510358382816, INFO > ApplicationClient::getActiveAppClientProto, current is > 0.",,,,,,,,"SysLoggerMain","syslogger.c",518, > 2016-06-20 17:56:03.905203 > CST,,,p526104,th503294176,,,,0,con4,,seg-10000,,,,,"LOG","00000","Resource > manager successfully loaded role > specifications.",,,,,,,0,,"resourcemanager.c",1272, > 2016-06-20 17:56:03.907677 > CST,,,p526095,th503294176,,,,0,,,seg-10000,,,,,"LOG","00000","3rd party error > log: > hawq-site.xml: > <configuration> > <property> > <name>hawq_master_address_host</name> > <value>HAWQ_Master</value> > <description>The host name of hawq master.</description> > </property> > <property> > <name>hawq_master_address_port</name> > <value>5432</value> > <description>The port of hawq master.</description> > </property> > <property> > <name>hawq_standby_address_host</name> > <value>none</value> > <description>The host name of hawq standby master.</description> > </property> > <property> > <name>hawq_segment_address_port</name> > <value>40000</value> > <description>The port of hawq segment.</description> > </property> > <property> > <name>hawq_dfs_url</name> > <value>thallo/hawq_default</value> > <description>URL for accessing HDFS.</description> > </property> > <property> > <name>hawq_master_directory</name> > <value>/data1/hawq-data-directory/masterdd</value> > <description>The directory of hawq master.</description> > </property> > <property> > <name>hawq_segment_directory</name> > <value>/data1/hawq-data-directory/segmentdd</value> > <description>The directory of hawq segment.</description> > </property> > <property> > <name>hawq_master_temp_directory</name> > <value>/data1/hawq/tmp</value> > <description>The temporary directory reserved for hawq > master.</description> > </property> > <property> > <name>hawq_segment_temp_directory</name> > <value>/data1/hawq/tmp</value> > <description>The temporary directory reserved for hawq > segment.</description> > </property> > > <!-- HAWQ 
resource manager parameters --> > <property> > <name>hawq_global_rm_type</name> > <value>yarn</value> > <description>The resource manager type to start for allocating > resource. > 'none' means hawq resource manager > exclusively uses whole > cluster; 'yarn' means hawq resource > manager contacts YARN > resource manager to negotiate resource. > </description> > </property> > <property> > <name>hawq_rm_memory_limit_perseg</name> > <value>64GB</value> > <description>The limit of memory usage in a hawq segment when > hawq_global_rm_type is set 'none'. > </description> > </property> > <property> > <name>hawq_rm_nvcore_limit_perseg</name> > <value>16</value> > <description>The limit of virtual core usage in a hawq segment > when > hawq_global_rm_type is set 'none'. > </description> > </property> > <property> > <name>hawq_rm_yarn_address</name> > <value>RM_IP:8032</value> > <description>The address of YARN resource manager > server.</description> > </property> > <property> > <name>hawq_rm_yarn_scheduler_address</name> > <value>RM_IP:8030</value> > <description>The address of YARN scheduler server.</description> > </property> > <property> > <name>hawq_rm_yarn_queue_name</name> > <value>hawq</value> > <description>The YARN queue name to register hawq resource > manager.</description> > </property> > <property> > <name>hawq_rm_yarn_app_name</name> > <value>hawq</value> > <description>The application name to register hawq resource > manager in YARN.</description> > </property> > <!-- HAWQ resource manager parameters end here. --> > <!-- HAWQ resource enforcement parameters --> > <property> > <name>hawq_re_cpu_enable</name> > <value>false</value> > <description>The control to enable/disable CPU resource > enforcement.</description> > </property> > <property> > <name>hawq_re_cgroup_mount_point</name> > <value>/sys/fs/cgroup</value> > <description>The mount point of CGroup file system for resource > enforcement. > For example, /sys/fs/cgroup/cpu/hawq > for CPU sub-system. 
> </description> > </property> > <property> > <name>hawq_re_cgroup_hierarchy_name</name> > <value>hawq</value> > <description>The name of the hierarchy to accomodate CGroup > directories/files for resource enforcement. > For example, /sys/fs/cgroup/cpu/hawq > for CPU sub-system. > </description> > </property> > <!-- HAWQ resource enforcement parameters end here. --> > <property> > <name>default_hash_table_bucket_number</name> > <value>6</value> > </property> > </configuration> -- This message was sent by Atlassian JIRA (v6.3.4#6332)