"barman.backup ERROR: Backup failed issuing stop backup command". No other info in barman logs.
I can see pg_start_backup() in the PostgreSQL logs, but nothing about pg_stop_backup() and no exceptions. There is nothing in the system logs either. Running pg_stop_backup() manually works fine, both directly on the master and via ssh (ssh postgres@server0011 'psql -U postgres -c "select pg_stop_backup()" site').
This started happening after the kernels were updated last week. Barman was also updated to 2.0, but we have since rolled it back (the output below reports barman_ver 1.6.1), and the issue persists. Has anyone experienced similar issues?
{
"global": {
"config": {
"barman_home": "/var/lib/barman",
"barman_user": "barman",
"compression": "gzip",
"errors_list": [],
"log_file": "/var/log/barman/barman.log",
"post_backup_script": "/var/lib/barman/script/post_backup.sh",
"pre_archive_script": "/var/lib/barman/script/pre_backup.sh"
},
"system_info": {
"barman_ver": "1.6.1",
"kernel_ver": "Linux server0013 2.6.32-642.6.2.el6.x86_64 #1 SMP Wed Oct 26 06:52:09 UTC 2016 x86_64 x86_64 x86_64 GNU/Linux",
"python_ver": "Python 2.6.6",
"release": "RedHat Linux CentOS release 6.8 (Final)",
"rsync_ver": "rsync version 3.0.6 protocol version 30",
"ssh_ver": "OpenSSH_5.3p1, OpenSSL 1.0.1e-fips 11 Feb 2013"
}
},
"servers": {
"main-11": {
"backups": {
"20161021T010001": {
"backup_id": "20161021T010001",
"backup_label": null,
"begin_offset": 40,
"begin_time": "Fri Oct 21 01:00:01 2016",
"begin_wal": "000000010000016400000023",
"begin_xlog": "164/23000028",
"config_file": "/data/pgsql/9.4/data/postgresql.conf",
"deduplicated_size": 125719834313,
"end_offset": 12717560,
"end_time": "Fri Oct 21 09:11:18 2016",
"end_wal": "00000001000001640000005E",
"end_xlog": "164/5EC20DF8",
"error": null,
"hba_file": "/data/pgsql/9.4/data/pg_hba.conf",
"ident_file": "/data/pgsql/9.4/data/pg_ident.conf",
"included_files": null,
"mode": "default",
"pgdata": "/data/pgsql/9.4/data",
"server_name": "main-11",
"size": 125719834313,
"status": "DONE",
"tablespaces": null,
"timeline": 1,
"version": 90401
},
"20161028T010001": {
"backup_id": "20161028T010001",
"backup_label": null,
"begin_offset": 40,
"begin_time": "Fri Oct 28 01:00:01 2016",
"begin_wal": "000000010000016700000075",
"begin_xlog": "167/75000028",
"config_file": "/data/pgsql/9.4/data/postgresql.conf",
"deduplicated_size": 126414384841,
"end_offset": 3989304,
"end_time": "Fri Oct 28 08:59:23 2016",
"end_wal": "00000001000001670000007E",
"end_xlog": "167/7E3CDF38",
"error": null,
"hba_file": "/data/pgsql/9.4/data/pg_hba.conf",
"ident_file": "/data/pgsql/9.4/data/pg_ident.conf",
"included_files": null,
"mode": "default",
"pgdata": "/data/pgsql/9.4/data",
"server_name": "main-11",
"size": 126414384841,
"status": "DONE",
"tablespaces": null,
"timeline": 1,
"version": 90401
},
"20161104T010001": {
"backup_id": "20161104T010001",
"backup_label": null,
"begin_offset": 40,
"begin_time": "Fri Nov 4 01:00:01 2016",
"begin_wal": "0000000100000170000000CD",
"begin_xlog": "170/CD000028",
"config_file": "/data/pgsql/9.4/data/postgresql.conf",
"deduplicated_size": 127901814473,
"end_offset": 104840,
"end_time": "Fri Nov 4 09:18:06 2016",
"end_wal": "000000010000017100000020",
"end_xlog": "171/20019988",
"error": null,
"hba_file": "/data/pgsql/9.4/data/pg_hba.conf",
"ident_file": "/data/pgsql/9.4/data/pg_ident.conf",
"included_files": null,
"mode": "default",
"pgdata": "/data/pgsql/9.4/data",
"server_name": "main-11",
"size": 127901814473,
"status": "DONE",
"tablespaces": null,
"timeline": 1,
"version": 90401
},
"20161114T090943": {
"backup_id": "20161114T090943",
"backup_label": null,
"begin_offset": 713504,
"begin_time": "Mon Nov 14 09:09:43 2016",
"begin_wal": "000000010000017E00000093",
"begin_xlog": "17E/930AE320",
"config_file": "/data/pgsql/9.4/data/postgresql.conf",
"deduplicated_size": null,
"end_offset": null,
"end_time": null,
"end_wal": null,
"end_xlog": null,
"error": "failure issuing stop backup command (Cannot terminate exclusive backup. You might have to manually execute pg_stop_backup() on your PostgreSQL server)",
"hba_file": "/data/pgsql/9.4/data/pg_hba.conf",
"ident_file": "/data/pgsql/9.4/data/pg_ident.conf",
"included_files": null,
"mode": "default",
"pgdata": "/data/pgsql/9.4/data",
"server_name": "main-11",
"size": null,
"status": "FAILED",
"tablespaces": null,
"timeline": 1,
"version": 90410
}
},
"config": {
"active": true,
"archiver": true,
"backup_directory": "/var/lib/barman/main-11",
"backup_method": "rsync",
"backup_options": "exclusive_backup",
"bandwidth_limit": null,
"barman_home": "/var/lib/barman",
"barman_lock_directory": "/var/lib/barman",
"basebackup_retry_sleep": 30,
"basebackup_retry_times": 0,
"basebackups_directory": "/var/lib/barman/main-11/base",
"compression": "gzip",
"conninfo": "host=server0011 user=postgres",
"custom_compression_filter": null,
"custom_decompression_filter": null,
"description": "Production DB on server0011 (MAIN-11)",
"disabled": false,
"errors_directory": "/var/lib/barman/main-11/errors",
"immediate_checkpoint": false,
"incoming_wals_directory": "/var/lib/barman/main-11/incoming",
"last_backup_maximum_age": "7 days",
"minimum_redundancy": 1,
"msg_list": [],
"name": "main-11",
"network_compression": false,
"path_prefix": null,
"post_archive_retry_script": null,
"post_archive_script": null,
"post_backup_retry_script": null,
"post_backup_script": "/var/lib/barman/script/post_backup.sh",
"pre_archive_retry_script": null,
"pre_archive_script": "/var/lib/barman/script/pre_backup.sh",
"pre_backup_retry_script": null,
"pre_backup_script": null,
"recovery_options": "",
"retention_policy": "window 3 w",
"retention_policy_mode": "auto",
"reuse_backup": null,
"ssh_command": "ssh postgres@server0011",
"streaming_archiver": false,
"streaming_archiver_name": "barman_receive_wal",
"streaming_conninfo": "host=server0011 user=postgres",
"streaming_wals_directory": "/var/lib/barman/main-11/streaming",
"tablespace_bandwidth_limit": null,
"wal_retention_policy": "simple-wal 3 w",
"wals_directory": "/var/lib/barman/main-11/wals"
},
"status": {
"archive_command": "rsync -a %p barman@server0013:/var/lib/barman/main-11/incoming/%f",
"archive_mode": "on",
"archived_count": 98568,
"config_file": "/data/pgsql/9.4/data/postgresql.conf",
"current_archived_wals_per_second": 0.0025753396900802402,
"current_size": 130283934320.0,
"current_xlog": "0000000100000180000000C5",
"data_directory": "/data/pgsql/9.4/data",
"failed_count": 1,
"hba_file": "/data/pgsql/9.4/data/pg_hba.conf",
"ident_file": "/data/pgsql/9.4/data/pg_ident.conf",
"is_archiving": true,
"is_superuser": true,
"last_archived_time": "Tue Nov 15 09:14:42 2016",
"last_archived_wal": "0000000100000180000000C4",
"last_failed_time": "Wed Oct 5 17:36:30 2016",
"last_failed_wal": "000000010000014C00000016",
"pgespresso_installed": false,
"server_txt_version": "9.4.10",
"stats_reset": "Fri Aug 28 15:38:44 2015",
"wal_level": "hot_standby"
},
"system_info": {
"kernel_ver": "Linux server0011 2.6.32-642.6.2.el6.x86_64 #1 SMP Wed Oct 26 06:52:09 UTC 2016 x86_64 x86_64 x86_64 GNU/Linux",
"python_ver": "Python 2.6.6",
"release": "RedHat Linux CentOS release 6.8 (Final)",
"rsync_ver": "rsync version 3.0.6 protocol version 30",
"ssh_ver": "OpenSSH_5.3p1, OpenSSL 1.0.1e-fips 11 Feb 2013"
}
}
}
}