Am 13.02.2013 um 18:22 schrieb Jebu Rajan:

> Thanks Reuti.
> 
> It's in /etc/hosts
> 
> [quantuser@quant linux-x64]$ cat /etc/hosts
> 127.0.0.1   localhost
> ::1         localhost
> 192.168.0.40 quant.simbox1
> 
> The error messages are
> [quantuser@quant linux-x64]$ cat /tmp/sge_messages
> 02/13/2013 14:19:48|  main|quant|C|abort qmaster startup due to communication errors
> 02/13/2013 14:29:35|  main|quant|C|abort qmaster startup due to communication errors
> 02/13/2013 14:32:44|  main|quant|C|abort qmaster startup due to communication errors
> 02/13/2013 14:35:07|  main|quant|C|abort qmaster startup due to communication errors
> 02/13/2013 14:37:38|  main|quant|C|abort qmaster startup due to communication errors
> 
> 
> It's on eth1 rather than eth0!
> 
> [quantuser@quant linux-x64]$ ifconfig eth1
> eth1      Link encap:Ethernet  HWaddr 90:E2:BA:20:E6:E9
>          inet addr:192.168.0.40  Bcast:192.168.0.255 Mask:255.255.255.0

Then you might need a $SGE_ROOT/default/common/host_aliases file with a line:

quant the.fqdn.of.eth0

assuming eth0 is the external interface of the machine.

-- Reuti

> 
> Thanks
> 
> 
> On 13/02/2013 17:15, Reuti wrote:
>> Am 13.02.2013 um 18:04 schrieb Jebu Rajan:
>> 
>>> Hi
>>> 
>>> I've been trying to get GE running on SL6.  I've been able to build 
>>> ge2011.11 but seem to have some outstanding problems with environment 
>>> settings.
>>> 
>>> All the usual name resolution stuff also seems to be fine.
>>> 
>>> [quantuser@quant linux-x64]$ hostname
>>> quant.simbox1
>>> 
>>> [quantuser@quant linux-x64]$ ./gethostname
>>> Hostname: quant.simbox1
>>> Aliases:
>>> Host Address(es): 192.168.0.40
>>> 
>>> [quantuser@quant linux-x64]$ ./gethostbyname quant.simbox1
>>> Hostname: quant.simbox1
>>> Aliases:
>>> Host Address(es): 192.168.0.40
>>> 
>>> [quantuser@quant linux-x64]$ ./gethostbyaddr 192.168.0.40
>>> Hostname: quant.simbox1
>>> Aliases:
>>> Host Address(es): 192.168.0.40
>>> 
>>> 
>>> However, when I try to start up I get:
>> This information is also in /etc/hosts?
>> 
>> Is there any file in /tmp of the qmaster with some hints?
>> 
>> The address 192.168.0.40 is on eth0?
>> 
>> -- Reuti
>> 
>> 
>>> Grid Engine qmaster startup
>>> ---------------------------
>>> 
>>> Starting qmaster daemon. Please wait ...
>>>   starting sge_qmaster
>>> 
>>> sge_qmaster start problem
>>> 
>>> sge_qmaster didn't start!
>>> sge_qmaster start problem
>>> 
>>> 
>>> With debug on I can see that there are various "reresolve hostname failed: 
>>> can't resolve host name" errors (see below).
>>> 
>>> Any help would be appreciated.
>>> 
>>> Thanks in advance
>>> 
>>> Jebber
>>> 
>>> 
>>> [root@quant linux-x64]# ./sge_qmaster
>>>     0   1414 140491200812800 --> qmaster() {
>>>     1   1414 140491200812800 --> sge_monitor_init() {
>>>     2   1414 140491200812800 --> sge_gettext_() {
>>>     3   1414 140491200812800 --> sge_get_message_id_output_implementation() 
>>> {
>>>     4   1414 140491200812800 <-- sge_get_message_id_output_implementation() 
>>> ../libs/uti/sge_language.c 582 }
>>>     5   1414 140491200812800 <-- sge_gettext_() ../libs/uti/sge_language.c 
>>> 730 }
>>>     6   1414 140491200812800 --> sge_monitor_reset() {
>>>     7   1414 140491200812800 <-- sge_monitor_reset() 
>>> ../libs/uti/sge_monitor.c 648 }
>>>     8   1414 140491200812800 --> sge_set_last_wait_time() {
>>>     9   1414 140491200812800 <-- sge_set_last_wait_time() 
>>> ../libs/uti/sge_monitor.c 530 }
>>>    10   1414 140491200812800 <-- sge_monitor_init() 
>>> ../libs/uti/sge_monitor.c 358 }
>>>    11   1414 140491200812800 --> init_array() {
>>>    12   1414 140491200812800 <-- init_array() ../libs/uti/sge_profiling.c 
>>> 1585 }
>>>    13   1414 140491200812800 --> sge_get_root_dir() {
>>>    14   1414 140491200812800 <-- sge_get_root_dir() ../libs/uti/sge_arch.c 
>>> 136 }
>>>    15   1414 140491200812800 --> sge_init_language_func() {
>>>    16   1414 140491200812800 <-- sge_init_language_func() 
>>> ../libs/uti/sge_language.c 455 }
>>>    17   1414 140491200812800 --> sge_init_language() {
>>>    18   1414 140491200812800     ****** starting localization procedure ... 
>>> **********
>>>    19   1414 140491200812800     could not get environment variable 
>>> "GRIDPACKAGE"
>>>    20   1414 140491200812800     could not get environment variable 
>>> "GRIDLOCALEDIR"
>>>    21   1414 140491200812800 --> sge_get_root_dir() {
>>>    22   1414 140491200812800 <-- sge_get_root_dir() ../libs/uti/sge_arch.c 
>>> 136 }
>>>    23   1414 140491200812800     setlocale() returns "en_US.UTF-8"
>>>    24   1414 140491200812800     cutting of language string after "_":
>>>    25   1414 140491200812800     locale directory: 
>>> >/home/quantuser/gridengine/ge2011.11/locale<
>>>    26   1414 140491200812800     package file: >linux-x64/gridengine.mo<
>>>    27   1414 140491200812800     language (LANG):  >en<
>>>    28   1414 140491200812800     loading message file: 
>>> /home/quantuser/gridengine/ge2011.11/locale/en/LC_MESSAGES/linux-x64/gridengine.mo
>>>    29   1414 140491200812800     could not open message file - error
>>>    30   1414 140491200812800     setlocale() returns "en_US.UTF-8"
>>>    31   1414 140491200812800     bindtextdomain() returns 
>>> "/home/quantuser/gridengine/ge2011.11/locale"
>>>    32   1414 140491200812800     textdomain() returns "linux-x64/gridengine"
>>>    33   1414 140491200812800     error id output     : disabled
>>>    34   1414 140491200812800     ****** starting localization procedure ... 
>>> failed  **
>>>    35   1414 140491200812800 <-- sge_init_language() 
>>> ../libs/uti/sge_language.c 381 }
>>>    36   1414 140491200812800 --> sge_daemonize_qmaster() {
>>>    37   1414 140491200812800     sge_qmaster is not daemonized
>>>    38   1414 140491200812800 <-- sge_daemonize_qmaster() 
>>> ../daemons/qmaster/sge_qmaster_threads.c 188 }
>>>    39   1414 140491200812800 --> sge_qmaster_thread_init() {
>>>    40   1414 140491200812800 --> sge_setup2() {
>>>    41   1414 140491200812800 --> sge_get_qmaster_port() {
>>>    42   1414 140491200812800     returning port value: 6444
>>>    43   1414 140491200812800 <-- sge_get_qmaster_port() 
>>> ../libs/uti/sge_hostname.c 219 }
>>>    44   1414 140491200812800 --> sge_get_execd_port() {
>>>    45   1414 140491200812800     returning port value: 6445
>>>    46   1414 140491200812800 <-- sge_get_execd_port() 
>>> ../libs/uti/sge_hostname.c 286 }
>>>    47   1414 140491200812800 --> sge_uid2user() {
>>>    48   1414 140491200812800 <-- sge_uid2user() ../libs/uti/sge_uidgid.c 
>>> 695 }
>>>    49   1414 140491200812800 --> sge_gid2group() {
>>>    50   1414 140491200812800 --> sge_getgrgid_r() {
>>>    51   1414 140491200812800 <-- sge_getgrgid_r() ../libs/uti/sge_uidgid.c 
>>> 1349 }
>>>    52   1414 140491200812800 <-- sge_gid2group() ../libs/uti/sge_uidgid.c 
>>> 762 }
>>>    53   1414 140491200812800 --> sge_gdi_ctx_class_create() {
>>>    54   1414 140491200812800 --> sge_gdi_ctx_setup() {
>>>    55   1414 140491200812800 --> sge_env_state_class_create() {
>>>    56   1414 140491200812800 --> sge_env_state_setup() {
>>>    57   1414 140491200812800 <-- sge_env_state_setup() 
>>> ../libs/uti/sge_env.c 157 }
>>>    58   1414 140491200812800 <-- sge_env_state_class_create() 
>>> ../libs/uti/sge_env.c 126 }
>>>    59   1414 140491200812800 --> sge_prog_state_class_create() {
>>>    60   1414 140491200812800 --> sge_prog_state_setup() {
>>>    61   1414 140491200812800 --> sge_gethostbyname() {
>>>    62   1414 140491200812800     Getting host by name - Linux
>>>    63   1414 140491200812800 --> sge_copy_hostent() {
>>>    64   1414 140491200812800     1 names in h_addr_list
>>>    65   1414 140491200812800     0 names in h_aliases
>>>    66   1414 140491200812800 <-- sge_copy_hostent() 
>>> ../libs/uti/sge_hostname.c 659 }
>>>    67   1414 140491200812800 <-- sge_gethostbyname() 
>>> ../libs/uti/sge_hostname.c 577 }
>>>    68   1414 140491200812800 <-- sge_prog_state_setup() 
>>> ../libs/uti/sge_prog.c 895 }
>>>    69   1414 140491200812800 <-- sge_prog_state_class_create() 
>>> ../libs/uti/sge_prog.c 808 }
>>>    70   1414 140491200812800 --> sge_path_state_class_create() {
>>>    71   1414 140491200812800 --> sge_path_state_setup() {
>>>    72   1414 140491200812800 <-- sge_path_state_setup() 
>>> ../libs/uti/setup_path.c 692 }
>>>    73   1414 140491200812800 <-- sge_path_state_class_create() 
>>> ../libs/uti/setup_path.c 585 }
>>>    74   1414 140491200812800 --> sge_bootstrap_state_class_create() {
>>>    75   1414 140491200812800 --> sge_bootstrap_state_class_init() {
>>>    76   1414 140491200812800 <-- sge_bootstrap_state_class_init() 
>>> ../libs/uti/sge_bootstrap.c 715 }
>>>    77   1414 140491200812800 --> sge_bootstrap_state_setup() {
>>>    78   1414 140491200812800 --> sge_get_confval_array() {
>>>    79   1414 140491200812800 <-- sge_get_confval_array() 
>>> ../libs/uti/sge_spool.c 656 }
>>>    80   1414 140491200812800 <-- sge_bootstrap_state_setup() 
>>> ../libs/uti/sge_bootstrap.c 866 }
>>>    81   1414 140491200812800 <-- sge_bootstrap_state_class_create() 
>>> ../libs/uti/sge_bootstrap.c 663 }
>>>    82   1414 140491200812800 --> feature_initialize_from_string() {
>>>    83   1414 140491200812800 --> feature_get_featureset_id() {
>>>    84   1414 140491200812800 <-- feature_get_featureset_id() 
>>> ../libs/sgeobj/sge_feature.c 413 }
>>>    85   1414 140491200812800 --> feature_activate() {
>>>    86   1414 140491200812800 <-- feature_activate() 
>>> ../libs/sgeobj/sge_feature.c 300 }
>>>    87   1414 140491200812800 <-- feature_initialize_from_string() 
>>> ../libs/sgeobj/sge_feature.c 200 }
>>>    88   1414 140491200812800 --> sge_csp_path_class_create() {
>>>    89   1414 140491200812800 --> sge_csp_path_setup() {
>>>    90   1414 140491200812800 
>>> sge_csp_path_setup:../libs/uti/sge_csp_path.c:316
>>>    91   1414 140491200812800 <-- sge_csp_path_setup() 
>>> ../libs/uti/sge_csp_path.c 447 }
>>>    92   1414 140491200812800 <-- sge_csp_path_class_create() 
>>> ../libs/uti/sge_csp_path.c 265 }
>>>    93   1414 140491200812800 --> sge_getpwnam_r() {
>>>    94   1414 140491200812800 <-- sge_getpwnam_r() ../libs/uti/sge_uidgid.c 
>>> 1294 }
>>>    95   1414 140491200812800 --> sge_group2gid() {
>>>    96   1414 140491200812800 <-- sge_group2gid() ../libs/uti/sge_uidgid.c 
>>> 627 }
>>>    97   1414 140491200812800 <-- sge_gdi_ctx_setup() 
>>> ../libs/gdi/sge_gdi_ctx.c 728 }
>>>    98   1414 140491200812800 <-- sge_gdi_ctx_class_create() 
>>> ../libs/gdi/sge_gdi_ctx.c 461 }
>>>    99   1414 140491200812800 --> sge_gdi_set_thread_local_ctx() {
>>>   100   1414 140491200812800 --> sge_bootstrap_state_set_thread_local() {
>>>   101   1414 140491200812800 --> sge_bootstrap_state_class_init() {
>>>   102   1414 140491200812800 <-- sge_bootstrap_state_class_init() 
>>> ../libs/uti/sge_bootstrap.c 715 }
>>>   103   1414 140491200812800 <-- sge_bootstrap_state_set_thread_local() 
>>> ../libs/uti/sge_bootstrap.c 159 }
>>>   104   1414 140491200812800 <-- sge_gdi_set_thread_local_ctx() 
>>> ../libs/gdi/sge_gdi_ctx.c 247 }
>>>   105   1414 140491200812800 <-- sge_setup2() ../libs/gdi/sge_gdi_ctx.c 
>>> 1957 }
>>>   106   1414 140491200812800 --> gdi2_reresolve_qualified_hostname() {
>>>   107   1414 140491200812800 --> sge_gethostbyname() {
>>>   108   1414 140491200812800     Getting host by name - Linux
>>>   109   1414 140491200812800 <-- sge_gethostbyname() 
>>> ../libs/uti/sge_hostname.c 577 }
>>>   110   1414 140491200812800 --> sge_gettext_() {
>>>   111   1414 140491200812800 --> sge_get_message_id_output_implementation() 
>>> {
>>>   112   1414 140491200812800 <-- sge_get_message_id_output_implementation() 
>>> ../libs/uti/sge_language.c 582 }
>>>   113   1414 140491200812800 <-- sge_gettext_() ../libs/uti/sge_language.c 
>>> 730 }
>>>   114   1414 140491200812800 <-- gdi2_reresolve_qualified_hostname() 
>>> ../libs/gdi/sge_gdi_ctx.c 2004 }
>>>   115   1414 140491200812800 <-- sge_qmaster_thread_init() 
>>> ../daemons/qmaster/setup_qmaster.c 258 }
>>>   116   1414 140491200812800 --> sge_gdi_ctx_class_prepare_enroll() {
>>>   117   1414 140491200812800 --> sge_gettext_() {
>>>   118   1414 140491200812800 --> sge_get_message_id_output_implementation() 
>>> {
>>>   119   1414 140491200812800 <-- sge_get_message_id_output_implementation() 
>>> ../libs/uti/sge_language.c 582 }
>>>   120   1414 140491200812800 <-- sge_gettext_() ../libs/uti/sge_language.c 
>>> 730 }
>>>   121   1414         main --> gdi2_reresolve_qualified_hostname() {
>>>   122   1414         main --> sge_gethostbyname() {
>>>   123   1414         main     Getting host by name - Linux
>>>   124   1414         main <-- sge_gethostbyname() 
>>> ../libs/uti/sge_hostname.c 577 }
>>>   125   1414 140491200812800 --> sge_gettext_() {
>>>   126   1414 140491200812800 --> sge_get_message_id_output_implementation() 
>>> {
>>>   127   1414 140491200812800 <-- sge_get_message_id_output_implementation() 
>>> ../libs/uti/sge_language.c 582 }
>>>   128   1414 140491200812800 <-- sge_gettext_() ../libs/uti/sge_language.c 
>>> 730 }
>>>   129   1414         main <-- gdi2_reresolve_qualified_hostname() 
>>> ../libs/gdi/sge_gdi_ctx.c 2004 }
>>>   130   1414 140491200812800 --> sge_gettext_() {
>>>   131   1414 140491200812800 --> sge_get_message_id_output_implementation() 
>>> {
>>>   132   1414 140491200812800 <-- sge_get_message_id_output_implementation() 
>>> ../libs/uti/sge_language.c 582 }
>>>   133   1414 140491200812800 <-- sge_gettext_() ../libs/uti/sge_language.c 
>>> 730 }
>>>   134   1414         main --> sge_gdi_ctx_class_error() {
>>>   135   1414         main --> sge_error_verror() {
>>>   136   1414         main     error: reresolve hostname failed: can't 
>>> resolve host name
>>>   137   1414         main <-- sge_error_verror() 
>>> ../libs/uti/sge_error_class.c 293 }
>>>   138   1414         main <-- sge_gdi_ctx_class_error() 
>>> ../libs/gdi/sge_gdi_ctx.c 520 }
>>>   139   1414         main <-- sge_gdi_ctx_class_prepare_enroll() 
>>> ../libs/gdi/sge_gdi_ctx.c 968 }
>>>   140   1414         main --> sge_gdi_ctx_class_prepare_enroll() {
>>>   141   1414         main --> gdi2_reresolve_qualified_hostname() {
>>>   142   1414         main <-- gdi2_reresolve_qualified_hostname() 
>>> ../libs/gdi/sge_gdi_ctx.c 2004 }
>>>   143   1414 140491200812800 --> sge_gettext_() {
>>>   144   1414 140491200812800 --> sge_get_message_id_output_implementation() 
>>> {
>>>   145   1414 140491200812800 <-- sge_get_message_id_output_implementation() 
>>> ../libs/uti/sge_language.c 582 }
>>>   146   1414 140491200812800 <-- sge_gettext_() ../libs/uti/sge_language.c 
>>> 730 }
>>>   147   1414         main --> sge_gdi_ctx_class_error() {
>>>   148   1414         main --> sge_error_verror() {
>>>   149   1414         main     error: reresolve hostname failed: can't 
>>> resolve host name
>>>   150   1414         main <-- sge_error_verror() 
>>> ../libs/uti/sge_error_class.c 293 }
>>>   151   1414         main <-- sge_gdi_ctx_class_error() 
>>> ../libs/gdi/sge_gdi_ctx.c 520 }
>>>   152   1414         main <-- sge_gdi_ctx_class_prepare_enroll() 
>>> ../libs/gdi/sge_gdi_ctx.c 968 }
>>>   153   1414         main --> sge_gdi_ctx_class_prepare_enroll() {
>>>   154   1414         main --> gdi2_reresolve_qualified_hostname() {
>>>   155   1414         main <-- gdi2_reresolve_qualified_hostname() 
>>> ../libs/gdi/sge_gdi_ctx.c 2004 }
>>> 
>>> _______________________________________________
>>> users mailing list
>>> [email protected]
>>> https://gridengine.org/mailman/listinfo/users
> 


_______________________________________________
users mailing list
[email protected]
https://gridengine.org/mailman/listinfo/users

Reply via email to