[pgpool-general: 271] pgpool restart after losing node

Gales Romain Romain.Gales at act.etat.lu
Fri Mar 9 00:15:05 JST 2012


Hi,

 

I am quite new to pgpool. I am trying a setup with simple streaming
replication. I followed this howto:
http://www.pgpool.net/pgpool-web/contrib_docs/simple_sr_setting2_3.1/index.html

 

Now, when I lose one node, all my clients are disconnected.

 

In the pgpool log file I find the following:

 

2012-03-08 15:52:16 LOG:   pid 10884: find_primary_node_repeatedly: waiting
for finding a primary node

2012-03-08 15:52:16 LOG:   pid 10884: find_primary_node: primary node id is
0

2012-03-08 15:52:16 LOG:   pid 10884: failover: set new primary node: 0

2012-03-08 15:52:16 LOG:   pid 10884: failover: set new master node: 0

2012-03-08 15:52:16 LOG:   pid 10884: failback done. reconnect host
test3(5432)

2012-03-08 15:52:16 LOG:   pid 10966: worker process received restart
request

2012-03-08 15:52:16 LOG:   pid 30470: recovery done

2012-03-08 15:52:17 LOG:   pid 10884: worker child 10966 exits with status
256

2012-03-08 15:52:17 LOG:   pid 10884: fork a new worker child pid 30487

2012-03-08 15:52:17 LOG:   pid 30470: pcp child process received restart
request

2012-03-08 15:52:17 LOG:   pid 30438: do_child: failback event found.
restart myself.

...

2012-03-08 15:52:17 LOG:   pid 10884: PCP child 30470 exits with status 256

2012-03-08 15:52:17 LOG:   pid 10884: fork a new PCP child pid 30519

2012-03-08 15:52:17 LOG:   pid 30466: statement: COMMIT

 

 

Is this restart normal?

 

 

My config:

 

# ----------------------------

# pgPool-II configuration file

# ----------------------------

#

# This file consists of lines of the form:

#

#   name = value

#

# Whitespace may be used.  Comments are introduced with "#" anywhere on a
line.

# The complete list of parameter names and allowed values can be found in
the

# pgPool-II documentation.

#

# This file is read on server startup and when the server receives a SIGHUP

# signal.  If you edit the file on a running system, you have to SIGHUP the

# server for the changes to take effect, or use "pgpool reload".  Some

# parameters, which are marked below, require a server shutdown and restart
to

# take effect.

#

 

 

#---------------------------------------------------------------------------
---

# CONNECTIONS

#---------------------------------------------------------------------------
---

 

# - pgpool Connection Settings -

 

listen_addresses = '*'

                                   # Host name or IP address to listen on:

                                   # '*' for all, '' for no TCP/IP
connections

                                   # (change requires restart)

port = 5432

                                   # Port number

                                   # (change requires restart)

socket_dir = '/tmp'

                                   # Unix domain socket path

                                   # The Debian package defaults to

                                   # /var/run/postgresql

                                   # (change requires restart)

 

 

# - pgpool Communication Manager Connection Settings -

 

pcp_port = 9898

                                   # Port number for pcp

                                   # (change requires restart)

pcp_socket_dir = '/tmp'

                                   # Unix domain socket path for pcp

                                   # The Debian package defaults to

                                   # /var/run/postgresql

                                   # (change requires restart)

 

# - Backend Connection Settings -

 

backend_hostname0 = 'test2'

                                   # Host name or IP address to connect to
for backend 0

backend_port0 = 5432

                                   # Port number for backend 0

backend_weight0 = 1

                                   # Weight for backend 0 (only in load
balancing mode)

backend_data_directory0 = '/opt/PostgreSQL/9.1/data/'

                                   # Data directory for backend 0

backend_flag0 = 'ALLOW_TO_FAILOVER'

                                   # Controls various backend behavior

                                   # ALLOW_TO_FAILOVER or
DISALLOW_TO_FAILOVER

backend_hostname1 = 'test3'

backend_port1 = 5432

backend_weight1 = 1

backend_data_directory1 = '/opt/PostgreSQL/9.1/data/'

backend_flag1 = 'ALLOW_TO_FAILOVER'

 

# - Authentication -

 

enable_pool_hba = off

                                   # Use pool_hba.conf for client
authentication

authentication_timeout = 60

                                   # Delay in seconds to complete client
authentication

                                   # 0 means no timeout.

 

# - SSL Connections -

 

ssl = off

                                   # Enable SSL support

                                   # (change requires restart)

#ssl_key = './server.key'

                                   # Path to the SSL private key file

                                   # (change requires restart)

#ssl_cert = './server.cert'

                                   # Path to the SSL public certificate file

                                   # (change requires restart)

#ssl_ca_cert = ''

                                   # Path to a single PEM format file

                                   # containing CA root certificate(s)

                                   # (change requires restart)

#ssl_ca_cert_dir = ''

                                   # Directory containing CA root
certificate(s)

                                   # (change requires restart)

 

 

#---------------------------------------------------------------------------
---

# POOLS

#---------------------------------------------------------------------------
---

 

# - Pool size -

 

num_init_children = 32

                                   # Number of pools

                                   # (change requires restart)

max_pool = 4

                                   # Number of connections per pool

                                   # (change requires restart)

 

# - Life time -

 

child_life_time = 300

                                   # Pool exits after being idle for this
many seconds

child_max_connections = 0

                                   # Pool exits after receiving that many
connections

                                   # 0 means no exit

connection_life_time = 0

                                   # Connection to backend closes after
being idle for this many seconds

                                   # 0 means no close

client_idle_limit = 0

                                   # Client is disconnected after being idle
for that many seconds

                                   # (even inside an explicit transaction!)

                                   # 0 means no disconnection

 

 

#---------------------------------------------------------------------------
---

# LOGS

#---------------------------------------------------------------------------
---

 

# - Where to log -

 

log_destination = 'stderr'

                                   # Where to log

                                   # Valid values are combinations of
stderr,

                                   # and syslog. Default to stderr.

 

# - What to log -

 

print_timestamp = on

                                   # Print timestamp on each line

                                   # (change requires restart)

 

log_connections = on

                                   # Log connections

log_hostname = on

                                   # Hostname will be shown in ps status

                                   # and in logs if connections are logged

log_statement = on

                                   # Log all statements

log_per_node_statement = on

                                   # Log all statements

                                   # with node and backend information

log_standby_delay = 'if_over_threshold'

                                   # Log standby delay

                                   # Valid values are combinations of
always,

                                   # if_over_threshold, none

 

# - Syslog specific -

 

syslog_facility = 'LOCAL0'

                                   # Syslog local facility. Default to
LOCAL0

syslog_ident = 'pgpool'

                                   # Syslog program identification string

                                   # Default to 'pgpool'

 

# - Debug -

 

debug_level = 0

                                   # Debug message verbosity level

                                   # 0 means no message, 1 or more mean
verbose

 

 

#---------------------------------------------------------------------------
---

# FILE LOCATIONS

#---------------------------------------------------------------------------
---

 

pid_file_name = '/var/run/pgpool/pgpool.pid'

                                   # PID file name

                                   # (change requires restart)

logdir = '/var/log/pgpool'

                                   # Directory of pgPool status file

                                   # (change requires restart)

 

 

#---------------------------------------------------------------------------
---

# CONNECTION POOLING

#---------------------------------------------------------------------------
---

 

connection_cache = on

                                   # Activate connection pools

                                   # (change requires restart)

 

                                   # Semicolon separated list of queries

                                   # to be issued at the end of a session

                                   # The default is for 8.3 and later

reset_query_list = 'ABORT; DISCARD ALL'

                                   # The following one is for 8.2 and before

#reset_query_list = 'ABORT; RESET ALL; SET SESSION AUTHORIZATION DEFAULT'

 

 

#---------------------------------------------------------------------------
---

# REPLICATION MODE

#---------------------------------------------------------------------------
---

 

replication_mode = off

                                   # Activate replication mode

                                   # (change requires restart)

replicate_select = off

                                   # Replicate SELECT statements

                                   # when in replication or parallel mode

                                   # replicate_select is higher priority
than

                                   # load_balance_mode.

 

insert_lock = off

                                   # Automatically locks a dummy row or a
table

                                   # with INSERT statements to keep SERIAL
data

                                   # consistency

                                   # Without SERIAL, no lock will be issued

lobj_lock_table = ''

                                   # When rewriting lo_creat command in

                                   # replication mode, specify table name to

                                   # lock

 

# - Degenerate handling -

 

replication_stop_on_mismatch = off

                                   # On disagreement with the packet kind

                                   # sent from backend, degenerate the node

                                   # which is most likely "minority"

                                   # If off, just force to exit this session

 

failover_if_affected_tuples_mismatch = off

                                   # On disagreement with the number of
affected

                                   # tuples in UPDATE/DELETE queries, then

                                   # degenerate the node which is most
likely

                                   # "minority".

                                   # If off, just abort the transaction to

                                   # keep the consistency

 

 

#---------------------------------------------------------------------------
---

# LOAD BALANCING MODE

#---------------------------------------------------------------------------
---

 

load_balance_mode = on

                                   # Activate load balancing mode

                                   # (change requires restart)

ignore_leading_white_space = on

                                   # Ignore leading white spaces of each
query

white_function_list = ''

                                   # Comma separated list of function names

                                   # that don't write to database

                                   # Regexp are accepted

black_function_list = 'currval,lastval,nextval,setval'

                                   # Comma separated list of function names

                                   # that write to database

                                   # Regexp are accepted

 

 

#---------------------------------------------------------------------------
---

# MASTER/SLAVE MODE

#---------------------------------------------------------------------------
---

 

master_slave_mode = on

                                   # Activate master/slave mode

                                   # (change requires restart)

master_slave_sub_mode = 'stream'

                                   # Master/slave sub mode

                                   # Valid values are slony or

                                   # stream. Default is slony.

                                   # (change requires restart)

 

# - Streaming -

 

sr_check_period = 10

                                   # Streaming replication check period

                                   # Disabled (0) by default

sr_check_user = 'postgres'

                                   # Streaming replication check user

                                   # This is necessary even if you disable
streaming

                                   # replication delay check by
sr_check_period = 0

sr_check_password = ''

                                   # Password for streaming replication
check user

delay_threshold = 10000000

                                   # Threshold before not dispatching query
to standby node

                                   # Unit is in bytes

                                   # Disabled (0) by default

 

# - Special commands -

 

follow_master_command = ''

                                   # Executes this command after master
failover

                                   # Special values:

                                   #   %d = node id

                                   #   %h = host name

                                   #   %p = port number

                                   #   %D = database cluster path

                                   #   %m = new master node id

                                   #   %H = hostname of the new master node

                                   #   %M = old master node id

                                   #   %P = old primary node id

                                   #   %% = '%' character

 

 

#---------------------------------------------------------------------------
---

# PARALLEL MODE AND QUERY CACHE

#---------------------------------------------------------------------------
---

 

parallel_mode = off

                                   # Activates parallel query mode

                                   # (change requires restart)

enable_query_cache = off

                                   # Activates query cache

                                   # (change requires restart)

 

pgpool2_hostname = ''

                                   # Set pgpool2 hostname

                                   # (change requires restart)

 

# - System DB info -

 

system_db_hostname  = 'localhost'

                                   # (change requires restart)

system_db_port = 5432

                                   # (change requires restart)

system_db_dbname = 'pgpool'

                                   # (change requires restart)

system_db_schema = 'pgpool_catalog'

                                   # (change requires restart)

system_db_user = 'pgpool'

                                   # (change requires restart)

system_db_password = ''

                                   # (change requires restart)

 

 

#---------------------------------------------------------------------------
---

# HEALTH CHECK

#---------------------------------------------------------------------------
---

 

health_check_period = 10

                                   # Health check period

                                   # Disabled (0) by default

health_check_timeout = 20

                                   # Health check timeout

                                   # 0 means no timeout

health_check_user = 'postgres'

                                  # Health check user

health_check_password = ''

                                   # Password for health check user

 

 

#---------------------------------------------------------------------------
---

# FAILOVER AND FAILBACK

#---------------------------------------------------------------------------
---

 

failover_command = '/etc/failover.sh %d "%h" %p %D %m %M "%H" %P'

                                   # Executes this command at failover

                                   # Special values:

                                   #   %d = node id

                                   #   %h = host name

                                   #   %p = port number

                                   #   %D = database cluster path

                                   #   %m = new master node id

                                   #   %H = hostname of the new master node

                                   #   %M = old master node id

                                   #   %P = old primary node id

                                   #   %% = '%' character

failback_command = '/bin/rm -f /var/log/pgpool/trigger/trigger_file1'

                                   # Executes this command at failback.

                                   # Special values:

                                   #   %d = node id

                                   #   %h = host name

                                   #   %p = port number

                                   #   %D = database cluster path

                                   #   %m = new master node id

                                   #   %H = hostname of the new master node

                                   #   %M = old master node id

                                   #   %P = old primary node id

                                   #   %% = '%' character

 

fail_over_on_backend_error = on

                                   # Initiates failover when writing to the

                                   # backend communication socket fails

                                   # This is the same behaviour as pgpool-II

                                   # 2.2.x and previous releases

                                   # If set to off, pgpool will report an

                                   # error and disconnect the session.

 

 

#---------------------------------------------------------------------------
---

# ONLINE RECOVERY

#---------------------------------------------------------------------------
---

 

recovery_user = 'postgres'

                                   # Online recovery user

recovery_password = ''

                                   # Online recovery password

recovery_1st_stage_command = 'basebackup.sh'

                                   # Executes a command in first stage

recovery_2nd_stage_command = ''

                                   # Executes a command in second stage

recovery_timeout = 90

                                   # Timeout in seconds to wait for the

                                   # recovering node's postmaster to start
up

                                   # 0 means no wait

client_idle_limit_in_recovery = 0

                                   # Client is disconnected after being idle

                                   # for that many seconds in the second
stage

                                   # of online recovery

                                   # 0 means no disconnection

                                   # -1 means immediate disconnection

 

 

#---------------------------------------------------------------------------
---

# OTHERS

#---------------------------------------------------------------------------
---

 

relcache_expire = 0

                                   # Life time of relation cache in seconds.

                                   # 0 means no cache expiration (the
default).

                                   # The relation cache is used to cache
the

                                   # query result against PostgreSQL system

                                   # catalog to obtain various information

                                   # including table structures or if it's a

                                   # temporary table or not. The cache is

                                   # maintained in a pgpool child local
memory

                                   # and being kept as long as it survives.

                                   # If someone modifies the table by using

                                   # ALTER TABLE or some such, the relcache
is

                                   # not consistent anymore.

                                   # For this purpose, relcache_expire

                                   # controls the life time of the cache.

 

 






Gales Romain 

service informatique


e-mail:  <mailto:romain.gales at act.etat.lu> romain.gales at act.etat.lu

Tel: +352 44901-250


 <http://www.act.public.lu> http://www.act.public.lu 


Description: logo

 

-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://www.sraoss.jp/pipermail/pgpool-general/attachments/20120308/b72a8fc7/attachment-0001.html>
-------------- next part --------------
A non-text attachment was scrubbed...
Name: image001.jpg
Type: image/jpeg
Size: 31368 bytes
Desc: not available
URL: <http://www.sraoss.jp/pipermail/pgpool-general/attachments/20120308/b72a8fc7/attachment-0001.jpg>


More information about the pgpool-general mailing list