1148 lines
44 KiB
C
1148 lines
44 KiB
C
/****************************************************************
|
|
* *
|
|
* Copyright 2003, 2012 Fidelity Information Services, Inc *
|
|
* *
|
|
* This source code contains the intellectual property *
|
|
* of its copyright holder(s), and is made available *
|
|
* under a license. If you do not know the terms of *
|
|
* the license, please stop and do not read further. *
|
|
* *
|
|
****************************************************************/
|
|
|
|
#include "mdef.h"
|
|
|
|
#include "gtm_string.h"
|
|
#include "gtm_stdlib.h"
|
|
#include "min_max.h"
|
|
#include "cli.h"
|
|
#include "gdsroot.h"
|
|
#include "gdsbt.h"
|
|
#include "gtm_facility.h"
|
|
#include "fileinfo.h"
|
|
#include "gdsblk.h"
|
|
#include "gdsfhead.h"
|
|
#include "gdscc.h" /* needed for tp.h */
|
|
#include "gdskill.h" /* needed for tp.h */
|
|
#include "filestruct.h"
|
|
#include "jnl.h"
|
|
#include "buddy_list.h"
|
|
#include "hashtab_int4.h" /* needed for muprec.h */
|
|
#include "hashtab_int8.h" /* needed for muprec.h */
|
|
#include "hashtab_mname.h" /* needed for muprec.h */
|
|
#include "hashtab.h"
|
|
#include "muprec.h"
|
|
#include "io.h"
|
|
#include "iosp.h"
|
|
#include "dpgbldir.h"
|
|
#include "have_crit.h"
|
|
#include "repl_sem.h"
|
|
#ifdef UNIX
|
|
#include "ftok_sems.h"
|
|
#include "repl_instance.h"
|
|
#include "mu_rndwn_repl_instance.h"
|
|
#include "deferred_signal_handler.h"
|
|
#elif defined(VMS)
|
|
#include <descrip.h>
|
|
#include "gtm_inet.h"
|
|
#include "iosb_disk.h" /* For mur_read_file.h */
|
|
#include "dpgbldir_sysops.h"
|
|
#include "gbldirnam.h"
|
|
#include "gtmrecv.h"
|
|
#endif
|
|
#include "mu_rndwn_file.h"
|
|
#include "read_db_files_from_gld.h"
|
|
#include "mur_db_files_from_jnllist.h"
|
|
#include "gtm_rename.h"
|
|
#include "gtmmsg.h"
|
|
#include "file_head_read.h"
|
|
#include "mupip_exit.h"
|
|
#include "mu_gv_cur_reg_init.h"
|
|
#include "dbfilop.h"
|
|
#include "mur_read_file.h" /* for "mur_fread_eof" prototype */
|
|
#include "tp_change_reg.h"
|
|
#include "gds_rundown.h"
|
|
#include "is_file_identical.h"
|
|
#include "repl_msg.h"
|
|
#include "gtmsource.h"
|
|
#include "mu_rndwn_replpool.h"
|
|
#include "gtm_logicals.h"
|
|
#ifdef UNIX
|
|
#include <sys/sem.h>
|
|
#include "tp.h" /* for "insert_region" prototype */
|
|
#include "gtm_time.h"
|
|
#include "interlock.h"
|
|
#include "eintr_wrapper_semop.h"
|
|
#include "gtm_semutils.h"
|
|
#include "sleep_cnt.h"
|
|
#include "gdsbgtr.h"
|
|
#include "heartbeat_timer.h"
|
|
#include "gtmsource_srv_latch.h"
|
|
#include "do_semop.h"
|
|
#include "wcs_sleep.h"
|
|
#include "wcs_flu.h"
|
|
#include "wcs_recover.h"
|
|
#include "is_proc_alive.h"
|
|
#include "anticipatory_freeze.h"
|
|
|
|
#define RELEASE_ACCESS_CONTROL(REGLIST) \
|
|
{ \
|
|
unix_db_info *lcl_udi; \
|
|
gd_region *lcl_reg; \
|
|
reg_ctl_list *lcl_rctl; \
|
|
int save_errno; \
|
|
\
|
|
lcl_reg = REGLIST->reg; \
|
|
lcl_rctl = REGLIST->rctl; \
|
|
lcl_udi = FILE_INFO(lcl_reg); \
|
|
assert(INVALID_SEMID != lcl_udi->semid); \
|
|
assert(lcl_udi->grabbed_access_sem && lcl_rctl->standalone); \
|
|
if (0 != (save_errno = do_semop(lcl_udi->semid, 0, -1, SEM_UNDO))) \
|
|
{ \
|
|
assert(FALSE); /* we hold it, so we should be able to release it*/ \
|
|
rts_error(VARLSTCNT(12) ERR_CRITSEMFAIL, 2, DB_LEN_STR(lcl_reg), ERR_SYSCALL, 5,\
|
|
RTS_ERROR_LITERAL("semop()"), CALLFROM, save_errno); \
|
|
} \
|
|
lcl_udi->grabbed_access_sem = FALSE; \
|
|
lcl_rctl->standalone = FALSE; \
|
|
}
|
|
|
|
#define GRAB_ACCESS_CONTROL(REGLIST) \
|
|
{ \
|
|
unix_db_info *lcl_udi; \
|
|
gd_region *lcl_reg; \
|
|
reg_ctl_list *lcl_rctl; \
|
|
int save_errno, sopcnt, status; \
|
|
struct sembuf sop[3]; \
|
|
\
|
|
SET_GTM_SOP_ARRAY(sop, sopcnt, FALSE, SEM_UNDO); \
|
|
assert(2 == sopcnt); \
|
|
lcl_reg = REGLIST->reg; \
|
|
lcl_rctl = REGLIST->rctl; \
|
|
lcl_udi = FILE_INFO(lcl_reg); \
|
|
assert(INVALID_SEMID != lcl_udi->semid); \
|
|
if (lcl_udi->grabbed_access_sem) \
|
|
assert(lcl_rctl->standalone); \
|
|
else \
|
|
{ \
|
|
SEMOP(lcl_udi->semid, sop, sopcnt, status, NO_WAIT); \
|
|
if (0 != status) \
|
|
{ \
|
|
save_errno = errno; \
|
|
assert(FALSE); \
|
|
rts_error(VARLSTCNT(12) ERR_CRITSEMFAIL, 2, DB_LEN_STR(lcl_reg), ERR_SYSCALL, 5,\
|
|
RTS_ERROR_LITERAL("semop()"), CALLFROM, save_errno); \
|
|
} \
|
|
lcl_udi->grabbed_access_sem = TRUE; \
|
|
lcl_rctl->standalone = TRUE; \
|
|
} \
|
|
}
|
|
#endif
|
|
|
|
GBLREF boolean_t blocksig_initialized;
|
|
GBLREF sigset_t block_sigsent;
|
|
GBLREF reg_ctl_list *mur_ctl;
|
|
GBLREF mur_opt_struct mur_options;
|
|
GBLREF mur_gbls_t murgbl;
|
|
GBLREF gd_region *gv_cur_region;
|
|
GBLREF jnlpool_addrs jnlpool;
|
|
GBLREF gd_addr *gd_header;
|
|
#ifdef UNIX
|
|
GBLREF jnlpool_ctl_ptr_t jnlpool_ctl;
|
|
GBLREF sgmnt_addrs *cs_addrs;
|
|
GBLREF boolean_t holds_sem[NUM_SEM_SETS][NUM_SRC_SEMS];
|
|
GBLREF int4 strm_index;
|
|
GBLREF uint4 process_id;
|
|
GBLREF jnl_gbls_t jgbl;
|
|
GBLREF sgmnt_data *cs_data;
|
|
GBLREF boolean_t jnlpool_init_needed;
|
|
#endif
|
|
|
|
|
|
#if defined(VMS)
|
|
error_def (ERR_MUJPOOLRNDWNFL);
|
|
error_def (ERR_MUJPOOLRNDWNSUC);
|
|
error_def (ERR_MURPOOLRNDWNFL);
|
|
error_def (ERR_MURPOOLRNDWNSUC);
|
|
#elif defined(UNIX)
|
|
error_def (ERR_JNLFILEOPNERR);
|
|
error_def (ERR_SYSCALL);
|
|
#endif
|
|
error_def (ERR_CRITSEMFAIL);
|
|
error_def (ERR_DBFILOPERR);
|
|
error_def (ERR_DBFRZRESETFL);
|
|
error_def (ERR_DBFRZRESETSUC);
|
|
error_def (ERR_DBJNLNOTMATCH);
|
|
error_def (ERR_DBRDONLY);
|
|
error_def (ERR_FILENOTFND);
|
|
error_def (ERR_FILEPARSE);
|
|
error_def (ERR_JNLBADRECFMT);
|
|
error_def (ERR_JNLDBTNNOMATCH);
|
|
error_def (ERR_JNLFILEDUP);
|
|
error_def (ERR_JNLNMBKNOTPRCD);
|
|
error_def (ERR_JNLSTATEOFF);
|
|
error_def (ERR_JNLTNOUTOFSEQ);
|
|
error_def (ERR_MUKILLIP);
|
|
error_def (ERR_MUPCLIERR);
|
|
error_def (ERR_MUPJNLINTERRUPT);
|
|
error_def (ERR_MUSTANDALONE);
|
|
error_def (ERR_NOPREVLINK);
|
|
error_def (ERR_NOSTARFILE);
|
|
error_def (ERR_NOTALLJNLEN);
|
|
error_def (ERR_NOTALLREPLON);
|
|
error_def (ERR_ORLBKFRZOVER);
|
|
error_def (ERR_ORLBKFRZPROG);
|
|
error_def (ERR_ORLBKNOV4BLK);
|
|
error_def (ERR_ORLBKSTART);
|
|
error_def (ERR_REPLSTATEOFF);
|
|
error_def (ERR_RLBKNOBIMG);
|
|
error_def (ERR_ROLLBKINTERRUPT);
|
|
error_def (ERR_SRVLCKWT2LNG);
|
|
error_def (ERR_STARFILE);
|
|
error_def (ERR_TEXT);
|
|
error_def (ERR_WCBLOCKED);
|
|
|
|
#define STAR_QUOTE "\"*\""
|
|
boolean_t mur_open_files()
|
|
{
|
|
boolean_t interrupted_rollback;
|
|
int jnl_total, jnlno, regno, max_reg_total;
|
|
unsigned int full_len;
|
|
unsigned short jnl_file_list_len; /* cli_get_str requires a short */
|
|
char jnl_file_list[MAX_LINE];
|
|
char *cptr, *cptr_last, *ctop;
|
|
jnl_ctl_list *jctl, *temp_jctl;
|
|
reg_ctl_list *rctl, *rctl_top, tmp_rctl;
|
|
gld_dbname_list *gld_db_files, *curr;
|
|
boolean_t star_specified, outofsync;
|
|
redirect_list *rl_ptr;
|
|
replpool_identifier replpool_id;
|
|
sgmnt_data_ptr_t csd;
|
|
sgmnt_addrs *csa;
|
|
file_control *fc;
|
|
freeze_status reg_frz_status;
|
|
# if defined(VMS)
|
|
uint4 status;
|
|
boolean_t sgmnt_found;
|
|
mstr gbldir_mstr, *tran_name;
|
|
gds_file_id file_id;
|
|
struct dsc$descriptor_s name_dsc;
|
|
char res_name[MAX_NAME_LEN + 2];/* +1 for the terminating null and
|
|
another +1 for the length stored in [0] by global_name() */
|
|
# else /* ONLINE ROLLBACK specific variables */
|
|
onln_rlbk_reg_list *reglist = NULL, *rl, *rl_last, *save_rl, *rl_new;
|
|
boolean_t x_lock, wait_for_kip, replinst_file_corrupt = FALSE, inst_requires_rlbk;
|
|
boolean_t jnlpool_sem_created;
|
|
sgmnt_addrs *tmpcsa;
|
|
sgmnt_data *tmpcsd;
|
|
gd_region *reg;
|
|
int4 llcnt, max_epoch_interval = 0, idx;
|
|
unix_db_info *udi;
|
|
now_t now;
|
|
char *time_ptr, time_str[CTIME_BEFORE_NL + 2]; /* for GET_CUR_TIME macro */
|
|
const char *verbose_ptr;
|
|
gtmsource_local_ptr_t gtmsourcelocal_ptr;
|
|
DEBUG_ONLY(int semval;)
|
|
DEBUG_ONLY(jnl_buffer_ptr_t jb;)
|
|
# endif
|
|
DCL_THREADGBL_ACCESS;
|
|
|
|
SETUP_THREADGBL_ACCESS;
|
|
UNIX_ONLY(jnlpool_init_needed = !mur_options.update);
|
|
jnl_file_list_len = MAX_LINE;
|
|
if (FALSE == CLI_GET_STR_ALL("FILE", jnl_file_list, &jnl_file_list_len))
|
|
mupip_exit(ERR_MUPCLIERR);
|
|
if ((1 == jnl_file_list_len && '*' == jnl_file_list[0]) ||
|
|
(STR_LIT_LEN(STAR_QUOTE) == jnl_file_list_len &&
|
|
0 == memcmp(jnl_file_list, STAR_QUOTE, STR_LIT_LEN(STAR_QUOTE))))
|
|
{
|
|
star_specified = TRUE;
|
|
if (NULL != mur_options.redirect)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_STARFILE, 2, LEN_AND_LIT("REDIRECT qualifier"));
|
|
mupip_exit(ERR_MUPCLIERR);
|
|
}
|
|
} else
|
|
{
|
|
star_specified = FALSE;
|
|
if (mur_options.rollback)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_NOSTARFILE, 2, LEN_AND_LIT("ROLLBACK qualifier"));
|
|
mupip_exit(ERR_MUPCLIERR);
|
|
}
|
|
}
|
|
/* We assume recovery will be done only on current global directory.
|
|
* That is, journal file names specified must be from current global directory.
|
|
*/
|
|
if (star_specified || mur_options.update && !mur_options.redirect)
|
|
{ /* "*" is specified or it is -recover or -rollback. We require gtmgbldir to be set in all these cases.
|
|
* The only exception is "-redirect" in which case the target database is obtained from -redirect
|
|
* instead of from the global directory.
|
|
*/
|
|
assert(NULL == gd_header);
|
|
gvinit(); /* read in current global directory */
|
|
assert(NULL != gd_header);
|
|
}
|
|
if (star_specified)
|
|
{
|
|
max_reg_total = gd_header->n_regions;
|
|
gld_db_files = read_db_files_from_gld(gd_header);
|
|
} else
|
|
gld_db_files = mur_db_files_from_jnllist(jnl_file_list, jnl_file_list_len, &max_reg_total);
|
|
if (NULL == gld_db_files)
|
|
return FALSE;
|
|
mur_ctl = (reg_ctl_list *)malloc(SIZEOF(reg_ctl_list) * max_reg_total);
|
|
memset(mur_ctl, 0, SIZEOF(reg_ctl_list) * max_reg_total);
|
|
curr = gld_db_files;
|
|
murgbl.max_extr_record_length = DEFAULT_EXTR_BUFSIZE;
|
|
murgbl.repl_standalone = FALSE;
|
|
if (mur_options.rollback)
|
|
{ /* Rundown the Jnlpool and Recvpool */
|
|
# if defined(UNIX)
|
|
if (!repl_inst_get_name((char *)replpool_id.instfilename, &full_len, SIZEOF(replpool_id.instfilename),
|
|
issue_gtm_putmsg))
|
|
{ /* appropriate gtm_putmsg would have already been issued by repl_inst_get_name */
|
|
return FALSE;
|
|
}
|
|
assert(NUM_SRC_SEMS == NUM_RECV_SEMS);
|
|
ASSERT_DONOT_HOLD_REPLPOOL_SEMS;
|
|
assert(NULL == jnlpool.repl_inst_filehdr);
|
|
UNIX_ONLY(if (!mu_rndwn_repl_instance(&replpool_id, FALSE, TRUE, &jnlpool_sem_created)))
|
|
VMS_ONLY(if (!mu_rndwn_repl_instance(&replpool_id, FALSE, TRUE)))
|
|
return FALSE; /* mu_rndwn_repl_instance will have printed appropriate message in case of error */
|
|
assert(jnlpool.jnlpool_ctl == jnlpool_ctl);
|
|
assert(jgbl.onlnrlbk || ANTICIPATORY_FREEZE_AVAILABLE || (NULL == jnlpool_ctl));
|
|
ASSERT_HOLD_REPLPOOL_SEMS;
|
|
assert(NULL != jnlpool.repl_inst_filehdr);
|
|
assert(INVALID_SEMID != jnlpool.repl_inst_filehdr->jnlpool_semid);
|
|
assert(INVALID_SEMID != jnlpool.repl_inst_filehdr->recvpool_semid);
|
|
murgbl.repl_standalone = TRUE;
|
|
/* Since rollback would not have necessarily done a jnlpool_init, it might not have initialized strm_index
|
|
* to the correct value in case of a supplementary instance. So do it now. This code is similar to that in
|
|
* jnlpool_init. Keep the two in sync (i.e. fix the other similarly if one changes).
|
|
*/
|
|
if (jnlpool.repl_inst_filehdr->is_supplementary)
|
|
{
|
|
assert((INVALID_SUPPL_STRM == strm_index) || (0 == strm_index));
|
|
strm_index = 0;
|
|
}
|
|
# elif defined(VMS)
|
|
gbldir_mstr.addr = GTM_GBLDIR;
|
|
gbldir_mstr.len = SIZEOF(GTM_GBLDIR) - 1;
|
|
tran_name = get_name(&gbldir_mstr);
|
|
memcpy(replpool_id.gtmgbldir, tran_name->addr, tran_name->len);
|
|
full_len = tran_name->len;
|
|
if (!get_full_path(replpool_id.gtmgbldir, tran_name->len,
|
|
replpool_id.gtmgbldir, &full_len, MAX_TRANS_NAME_LEN, &status))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_FILENOTFND, 2, tran_name->len, tran_name->addr);
|
|
return FALSE;
|
|
}
|
|
else
|
|
{
|
|
tran_name->len = full_len; /* since on vax, mstr.len is a 'short' */
|
|
set_gdid_from_file((gd_id_ptr_t)&file_id, replpool_id.gtmgbldir, tran_name->len);
|
|
global_name("GT$P", &file_id, res_name); /* P - Stands for Journal Pool */
|
|
res_name[res_name[0] + 1] = '\0';
|
|
STRCPY(replpool_id.repl_pool_key, &res_name[1]);
|
|
replpool_id.pool_type = JNLPOOL_SEGMENT;
|
|
sgmnt_found = FALSE;
|
|
if (mu_rndwn_replpool(&replpool_id, FALSE, &sgmnt_found) && sgmnt_found)
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MUJPOOLRNDWNSUC, 4, res_name[0], &res_name[1],
|
|
tran_name->len, replpool_id.gtmgbldir);
|
|
else if (sgmnt_found)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MUJPOOLRNDWNFL, 4, res_name[0], &res_name[1],
|
|
tran_name->len, replpool_id.gtmgbldir);
|
|
return FALSE;
|
|
}
|
|
global_name("GT$R", &file_id, res_name); /* R - Stands for Recv Pool */
|
|
res_name[res_name[0] + 1] = '\0';
|
|
STRCPY(replpool_id.repl_pool_key, &res_name[1]);
|
|
replpool_id.pool_type = RECVPOOL_SEGMENT;
|
|
sgmnt_found = FALSE;
|
|
if (mu_rndwn_replpool(&replpool_id, FALSE, &sgmnt_found) && sgmnt_found)
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MURPOOLRNDWNSUC, 4, res_name[0], &res_name[1],
|
|
tran_name->len, replpool_id.gtmgbldir);
|
|
else if (sgmnt_found)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MURPOOLRNDWNFL, 4, res_name[0], &res_name[1],
|
|
tran_name->len, replpool_id.gtmgbldir);
|
|
return FALSE;
|
|
}
|
|
}
|
|
# endif
|
|
}
|
|
for (murgbl.reg_full_total = 0, rctl = mur_ctl, rctl_top = mur_ctl + max_reg_total;
|
|
rctl < rctl_top; rctl++, curr = curr->next)
|
|
{
|
|
rctl->initialized = FALSE;
|
|
rctl->gd = curr->gd; /* region structure is already set with proper values */
|
|
rctl->standalone = FALSE;
|
|
rctl->csa = NULL;
|
|
rctl->csd = NULL;
|
|
rctl->jctl = rctl->jctl_head = rctl->jctl_alt_head = rctl->jctl_turn_around = rctl->jctl_apply_pblk = NULL;
|
|
murgbl.reg_full_total++; /* mur_close_files() expects rctl->csa and rctl->jctl to be initialized.
|
|
* so consider this rctl only after those have been initialized. */
|
|
/* Do region specific initialization */
|
|
init_hashtab_mname(&rctl->gvntab, 0, HASHTAB_NO_COMPACT, HASHTAB_NO_SPARE_TABLE); /* for mur_forward() */
|
|
rctl->db_ctl = (file_control *)malloc(SIZEOF(file_control));
|
|
memset(rctl->db_ctl, 0, SIZEOF(file_control));
|
|
mur_rctl_desc_alloc(rctl); /* Allocate rctl->mur_desc associated buffers */
|
|
/* For redirect we just need to change the name of database. recovery will redirect to new database file */
|
|
if (mur_options.redirect)
|
|
{
|
|
for (rl_ptr = mur_options.redirect; rl_ptr != NULL; rl_ptr = rl_ptr->next)
|
|
{
|
|
if (curr->gd->dyn.addr->fname_len == rl_ptr->org_name_len &&
|
|
0 == memcmp(curr->gd->dyn.addr->fname, rl_ptr->org_name, rl_ptr->org_name_len))
|
|
{
|
|
curr->gd->dyn.addr->fname_len = rl_ptr->new_name_len;
|
|
memcpy(curr->gd->dyn.addr->fname, rl_ptr->new_name, curr->gd->dyn.addr->fname_len);
|
|
curr->gd->dyn.addr->fname[curr->gd->dyn.addr->fname_len] = 0;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
if (!mupfndfil(rctl->gd, NULL))
|
|
{
|
|
rctl->db_present = FALSE;
|
|
if (mur_options.update || star_specified)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_FILENOTFND, 2, DB_LEN_STR(rctl->gd));
|
|
return FALSE;
|
|
}
|
|
} else
|
|
{
|
|
rctl->db_present = TRUE;
|
|
if (mur_options.update)
|
|
{
|
|
gv_cur_region = rctl->gd; /* mu_rndwn_file() assumes gv_cur_region is set in VMS */
|
|
# ifdef UNIX
|
|
if (!jgbl.onlnrlbk)
|
|
{
|
|
# endif
|
|
if (!STANDALONE(rctl->gd)) /* STANDALONE macro calls mu_rndwn_file() */
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_MUSTANDALONE, 2, DB_LEN_STR(rctl->gd));
|
|
return FALSE;
|
|
}
|
|
rctl->standalone = TRUE;
|
|
# ifdef UNIX
|
|
}
|
|
# endif
|
|
}
|
|
if (mur_options.update || mur_options.extr[GOOD_TN])
|
|
{
|
|
gvcst_init(rctl->gd);
|
|
# ifdef UNIX
|
|
if (jgbl.onlnrlbk)
|
|
{
|
|
TP_CHANGE_REG(rctl->gd);
|
|
if (!cs_data->fully_upgraded)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(6) ERR_ORLBKNOV4BLK, 4, REG_LEN_STR(gv_cur_region),
|
|
DB_LEN_STR(gv_cur_region));
|
|
return FALSE;
|
|
}
|
|
max_epoch_interval = MAX(cs_data->epoch_interval, max_epoch_interval);
|
|
assert(!cs_addrs->hold_onto_crit);
|
|
rctl->standalone = TRUE;
|
|
}
|
|
# endif
|
|
if (mur_options.update)
|
|
{
|
|
assert(rctl->standalone);
|
|
UNIX_ONLY(assert((FILE_INFO(rctl->gd))->grabbed_access_sem));
|
|
if (rctl->gd->read_only)
|
|
{ /* recover/rollback cannot proceed if the process has read-only permissions */
|
|
gtm_putmsg(VARLSTCNT(4) ERR_DBRDONLY, 2, DB_LEN_STR(rctl->gd));
|
|
return FALSE;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
assert(!mur_options.update || rctl->standalone);
|
|
assert(mur_options.update || !rctl->standalone);
|
|
}
|
|
assert(murgbl.reg_full_total == max_reg_total);
|
|
DEBUG_ONLY(curr = gld_db_files;)
|
|
# ifdef UNIX
|
|
assert(!jgbl.onlnrlbk || (0 != max_epoch_interval));
|
|
if (jgbl.onlnrlbk)
|
|
{
|
|
inst_requires_rlbk = FALSE;
|
|
udi = FILE_INFO(jnlpool.jnlpool_dummy_reg);
|
|
send_msg(VARLSTCNT(6) ERR_ORLBKSTART, 4, LEN_AND_STR(jnlpool.repl_inst_filehdr->inst_info.this_instname),
|
|
LEN_AND_STR(udi->fn));
|
|
gtm_putmsg(VARLSTCNT(6) ERR_ORLBKSTART, 4, LEN_AND_STR(jnlpool.repl_inst_filehdr->inst_info.this_instname),
|
|
LEN_AND_STR(udi->fn));
|
|
/* Need to get the gtmsource_srv_latch BEFORE grab_crit to avoid deadlocks */
|
|
if (NULL != jnlpool_ctl)
|
|
{
|
|
assert(udi == FILE_INFO(jnlpool.jnlpool_dummy_reg));
|
|
csa = &udi->s_addrs;
|
|
ASSERT_VALID_JNLPOOL(csa);
|
|
assert(INVALID_SEMID != jnlpool.repl_inst_filehdr->jnlpool_semid);
|
|
assert(INVALID_SEMID != jnlpool.repl_inst_filehdr->recvpool_semid);
|
|
assert(INVALID_SEMID != jnlpool.repl_inst_filehdr->jnlpool_shmid);
|
|
gtmsourcelocal_ptr = &jnlpool.gtmsource_local_array[0];
|
|
for (idx = 0; NUM_GTMSRC_LCL > idx; idx++, gtmsourcelocal_ptr++)
|
|
{ /* Get hold of all the gtmsource_srv_latch in all the source server slots in the journal pool. Hold
|
|
* onto it until the end (in mur_close_files).
|
|
*/
|
|
jnlpool.gtmsource_local = gtmsourcelocal_ptr;
|
|
if (!grab_gtmsource_srv_latch(>msourcelocal_ptr->gtmsource_srv_latch,
|
|
2 * max_reg_total * max_epoch_interval, GRAB_GTMSOURCE_SRV_LATCH_ONLY))
|
|
assertpro(FALSE); /* should not reach here due to rts_error in the above function */
|
|
|
|
}
|
|
}
|
|
/* For online rollback we need to grab crit on all the regions. But, this has to be done in the ftok order. To
|
|
* setup the regions in the ftok order invoke insert_region. Note that all we need is a list of regions sorted by
|
|
* the inode/device numbers. So, a bubble sort would have worked just fine. But, since most of the code uses
|
|
* insert_region, we are using it here to avoid code duplication. Note: We could ideally use tp_reg_list here as
|
|
* well.
|
|
*/
|
|
for (rctl = mur_ctl, rctl_top = mur_ctl + max_reg_total; rctl < rctl_top; rctl++)
|
|
{
|
|
assert(rctl->gd->open); /* region should have been opened by now */
|
|
rl_new = (onln_rlbk_reg_list *)insert_region(rctl->gd,
|
|
(tp_region **)(®list), NULL, SIZEOF(onln_rlbk_reg_list));
|
|
assert(NULL != rl_new);
|
|
rl_new->rctl = rctl; /* store the backward link to rctl */
|
|
}
|
|
/* The following loop is mostly borrowed from tp_crit_all_regions() */
|
|
TREF(donot_write_inctn_in_wcs_recover) = TRUE; /* donot write INCTN if wcs_recover is called below */
|
|
TREF(wcs_recover_done) = FALSE;
|
|
for (llcnt = 0; ; llcnt++)
|
|
{
|
|
x_lock = TRUE; /* assume success */
|
|
for (rl = reglist; NULL != rl; rl = rl->fPtr)
|
|
{
|
|
reg = rl->reg;
|
|
tmpcsa = &FILE_INFO(reg)->s_addrs;
|
|
tmpcsd = tmpcsa->hdr;
|
|
GRAB_ACCESS_CONTROL(rl);
|
|
grab_crit(reg);
|
|
if (tmpcsd->freeze)
|
|
{
|
|
save_rl = rl;
|
|
rl = rl->fPtr; /* Increment so we release the lock we actually got */
|
|
x_lock = FALSE;
|
|
break;
|
|
}
|
|
}
|
|
if (x_lock)
|
|
break;
|
|
rl_last = rl;
|
|
for (rl = reglist; rl_last != rl; rl = rl->fPtr)
|
|
{
|
|
rel_crit(rl->reg);
|
|
RELEASE_ACCESS_CONTROL(rl);
|
|
}
|
|
assert((NULL != save_rl) && (tmpcsa->region == save_rl->reg));
|
|
GET_CUR_TIME;
|
|
send_msg(VARLSTCNT(8) ERR_ORLBKFRZPROG, 6, CTIME_BEFORE_NL, time_ptr, REG_LEN_STR(save_rl->reg),
|
|
DB_LEN_STR(save_rl->reg));
|
|
gtm_putmsg(VARLSTCNT(8) ERR_ORLBKFRZPROG, 6, CTIME_BEFORE_NL, time_ptr, REG_LEN_STR(save_rl->reg),
|
|
DB_LEN_STR(save_rl->reg));
|
|
while (tmpcsd->freeze)
|
|
{
|
|
if (MAXHARDCRITS < llcnt)
|
|
wcs_sleep(llcnt); /* Don't waste CPU cycles anymore */
|
|
llcnt++;
|
|
}
|
|
GET_CUR_TIME;
|
|
send_msg(VARLSTCNT(8) ERR_ORLBKFRZOVER, 6, CTIME_BEFORE_NL, time_ptr, REG_LEN_STR(save_rl->reg),
|
|
DB_LEN_STR(save_rl->reg));
|
|
gtm_putmsg(VARLSTCNT(8) ERR_ORLBKFRZOVER, 6, CTIME_BEFORE_NL, time_ptr, REG_LEN_STR(save_rl->reg),
|
|
DB_LEN_STR(save_rl->reg));
|
|
}
|
|
inst_requires_rlbk |= TREF(wcs_recover_done);
|
|
assert(x_lock); /* Now we have crit on all the regions (for this global directory) */
|
|
/* Get the replication locks. If there is NO journal pool, then there is nothing more to do as we had
|
|
* already flushed the journal pool in mu_rndwn_replpool. But, if the journal pool exists, then it indicates
|
|
* that processes are still attached to the journal pool. So, grab the journal pool locks, flush the journal
|
|
* pool and set the field in the journal pool indicating that online rollback is in progress and other
|
|
* processes need to back off.
|
|
*/
|
|
if (NULL != jnlpool_ctl)
|
|
{ /* Validate the journal pool is accessible and the offsets of various structures within it are intact */
|
|
grab_lock(jnlpool.jnlpool_dummy_reg, GRAB_LOCK_ONLY);
|
|
csa->hold_onto_crit = TRUE; /* No more unconditional rel_lock() */
|
|
assert(jnlpool.repl_inst_filehdr->crash); /* since we haven't removed the journal pool */
|
|
repl_inst_flush_jnlpool(FALSE, FALSE);
|
|
assert((0 == jnlpool_ctl->onln_rlbk_pid) || !is_proc_alive(jnlpool_ctl->onln_rlbk_pid, 0));
|
|
jnlpool_ctl->onln_rlbk_pid = process_id;
|
|
}
|
|
replinst_file_corrupt = TRUE;
|
|
/* Indicate to all other processes that ONLINE ROLLBACK is now in progress */
|
|
for (rctl = mur_ctl, rctl_top = mur_ctl + max_reg_total; rctl < rctl_top; rctl++)
|
|
{
|
|
reg = rctl->gd;
|
|
TP_CHANGE_REG(reg);
|
|
# ifdef DEBUG
|
|
udi = FILE_INFO(reg);
|
|
assert(1 == (semval = semctl(udi->semid, 0, GETVAL)));
|
|
# endif
|
|
assert(cs_addrs->now_crit);
|
|
cs_addrs->hold_onto_crit = TRUE; /* No more unconditional grab_crit/rel_crit on this region */
|
|
/* Do wcs_flu which guarantees that all pending phase 2 commits are done and hardened to disk */
|
|
/* If Online Rollback is invoked right after a crash in the midst of a commit, early_tn
|
|
* can be different from curr_tn (as curr_tn is not incremented until Phase 1 of the commit).
|
|
* A wcs_flu done below has asserts to the effect that it is never invoked with an out-of-sync
|
|
* early_tn and curr_tn. But, Online Rollback is an exception in that it will be holding crit
|
|
* for the entire duration and will be fixing the cache and rolling back the database to a
|
|
* consistent state. So, set the early_tn to curr_tn in case they differ. To avoid unnecessary
|
|
* CPU cycles, set it to curr_tn unconditionally.
|
|
*/
|
|
assert(1 >= (cs_addrs->ti->early_tn - cs_addrs->ti->curr_tn));
|
|
inst_requires_rlbk |= (cs_addrs->ti->early_tn != cs_addrs->ti->curr_tn);
|
|
cs_addrs->ti->early_tn = cs_addrs->ti->curr_tn;
|
|
if (!wcs_flu(WCSFLU_NONE))
|
|
{
|
|
assert(cs_addrs->nl->wcs_phase2_commit_pidcnt); /* only reason why wcs_flu can fail */
|
|
SET_TRACEABLE_VAR(cs_addrs->nl->wc_blocked, TRUE);
|
|
BG_TRACE_PRO_ANY(cs_addrs, wc_blocked_onln_rlbk);
|
|
send_msg(VARLSTCNT(8) ERR_WCBLOCKED, 6, LEN_AND_LIT("wc_blocked_onln_rlbk"),
|
|
process_id, &cs_addrs->ti->curr_tn, DB_LEN_STR(gv_cur_region));
|
|
inst_requires_rlbk = TRUE;
|
|
assert(TREF(donot_write_inctn_in_wcs_recover)); /* should still be set to TRUE */
|
|
wcs_recover(reg);
|
|
/* Now that wcs_recover is done, do a wcs_flu(WCSFLU_NONE) once again. This time we don't expect
|
|
* wcs_flu to error out.
|
|
*/
|
|
if (!wcs_flu(WCSFLU_NONE))
|
|
GTMASSERT;
|
|
}
|
|
assert(0 == cs_addrs->nl->wcs_phase2_commit_pidcnt); /* should be zero after wcs_flu and wcs_recover */
|
|
/* we played with access control lock before, make sure we hold it on all regions now */
|
|
assert(rctl->standalone);
|
|
assert((FILE_INFO(reg))->grabbed_access_sem);
|
|
assert((0 == cs_addrs->nl->onln_rlbk_pid) || !is_proc_alive(cs_addrs->nl->onln_rlbk_pid, 0));
|
|
cs_addrs->nl->onln_rlbk_pid = process_id;
|
|
# ifdef DEBUG
|
|
/* ensure that we don't have any pending journal writes or flushes */
|
|
assert(!JNL_ALLOWED(cs_data) || (NULL != cs_addrs->jnl) && (NULL != cs_addrs->jnl->jnl_buff));
|
|
if (NULL != cs_addrs->jnl)
|
|
{
|
|
jb = cs_addrs->jnl->jnl_buff;
|
|
assert((jb->freeaddr == jb->dskaddr) && (jb->dskaddr == jb->fsync_dskaddr));
|
|
}
|
|
# endif
|
|
if (cs_data->kill_in_prog)
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MUKILLIP, 4, DB_LEN_STR(reg), LEN_AND_LIT("ONLINE ROLLBACK"));
|
|
/* Ensure that inhibit_kills is ZERO at this point. This is because, we hold crit at this point and anyone
|
|
* who wants to set inhibit_kills need crit. The reason this is important is because t_end/tp_tend has
|
|
* logic to restart if inhibit_kills is set to TRUE and we don't want online rollback to restart
|
|
*/
|
|
assert(0 == cs_addrs->nl->inhibit_kills);
|
|
}
|
|
TREF(donot_write_inctn_in_wcs_recover) = FALSE;
|
|
}
|
|
# endif
|
|
for (rctl = mur_ctl, rctl_top = mur_ctl + max_reg_total; rctl < rctl_top; rctl++)
|
|
{
|
|
if (rctl->db_present)
|
|
{
|
|
if (mur_options.update || mur_options.extr[GOOD_TN])
|
|
{ /* NOTE: Only for collation info extract needs database access */
|
|
DEFER_INTERRUPTS(INTRPT_IN_MUR_OPEN_FILES); /* temporarily disable MUPIP STOP/signal handling. */
|
|
|
|
csa = rctl->csa = &FILE_INFO(rctl->gd)->s_addrs;
|
|
csd = rctl->csd = rctl->csa->hdr;
|
|
UNIX_ONLY(assert(!jgbl.onlnrlbk || (csa->now_crit && csa->hold_onto_crit)));
|
|
if (mur_options.update)
|
|
{
|
|
assert(!csa->nl->donotflush_dbjnl UNIX_ONLY(|| jgbl.onlnrlbk));
|
|
csa->nl->donotflush_dbjnl = TRUE; /* indicate gds_rundown/mu_rndwn_file to not wcs_flu()
|
|
* this shared memory until recover/rlbk cleanly exits */
|
|
}
|
|
assert(!JNL_ENABLED(csd) || 0 == csd->jnl_file_name[csd->jnl_file_len]);
|
|
rctl->db_ctl->file_type = rctl->gd->dyn.addr->file_cntl->file_type;
|
|
rctl->db_ctl->file_info = rctl->gd->dyn.addr->file_cntl->file_info;
|
|
rctl->recov_interrupted = csd->recov_interrupted;
|
|
if (mur_options.update && rctl->recov_interrupted)
|
|
{ /* interrupted recovery might have changed current csd's jnl_state/repl_state.
|
|
* restore the state of csd before the start of interrupted recovery.
|
|
*/
|
|
if (mur_options.forward)
|
|
{ /* error out. need fresh backup of database for forward recovery */
|
|
gtm_putmsg(VARLSTCNT(4) ERR_MUPJNLINTERRUPT, 2, DB_LEN_STR(rctl->gd));
|
|
ENABLE_INTERRUPTS(INTRPT_IN_MUR_OPEN_FILES);
|
|
return FALSE;
|
|
}
|
|
/* In case rollback with non-zero resync_seqno got interrupted, we would have
|
|
* written intrpt_recov_resync_seqno. If so, cannot use RECOVER now.
|
|
* In all other cases, intrpt_recov_resolve_time would have been written.
|
|
*/
|
|
if (!mur_options.rollback)
|
|
{
|
|
interrupted_rollback = FALSE;
|
|
if (csd->intrpt_recov_resync_seqno)
|
|
interrupted_rollback = TRUE;
|
|
# ifdef UNIX
|
|
else
|
|
{
|
|
for (idx = 0; idx < MAX_SUPPL_STRMS; idx++)
|
|
{
|
|
if (csd->intrpt_recov_resync_strm_seqno[idx])
|
|
{
|
|
interrupted_rollback = TRUE;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
# endif
|
|
if (interrupted_rollback)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_ROLLBKINTERRUPT, 2, DB_LEN_STR(rctl->gd));
|
|
ENABLE_INTERRUPTS(INTRPT_IN_MUR_OPEN_FILES);
|
|
return FALSE;
|
|
}
|
|
}
|
|
csd->jnl_state = csd->intrpt_recov_jnl_state;
|
|
csd->repl_state = csd->intrpt_recov_repl_state;
|
|
}
|
|
/* Save current states */
|
|
rctl->jnl_state = csd->jnl_state;
|
|
rctl->repl_state = csd->repl_state;
|
|
rctl->before_image = csd->jnl_before_image;
|
|
rctl->initialized = TRUE;
|
|
ENABLE_INTERRUPTS(INTRPT_IN_MUR_OPEN_FILES); /* reenable the interrupts */
|
|
if (mur_options.update)
|
|
{
|
|
if (!mur_options.rollback)
|
|
{
|
|
if (!mur_options.forward && !JNL_ENABLED(csd))
|
|
{
|
|
if (!star_specified)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_JNLSTATEOFF, 2, DB_LEN_STR(rctl->gd));
|
|
return FALSE;
|
|
}
|
|
continue;
|
|
}
|
|
} else
|
|
{
|
|
if (!REPL_ENABLED(csd))
|
|
{ /* Replication is either OFF or WAS_ON. Journaling could be ENABLED or not.
|
|
* If replication is OFF and journaling is DISABLED, there is no issue.
|
|
* Any other combination (including replication being WAS_ON) is an error
|
|
* as we dont have the complete set of journal records to do the rollback.
|
|
*/
|
|
if (REPL_ALLOWED(csd) || JNL_ENABLED(csd))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_REPLSTATEOFF, 2, DB_LEN_STR(rctl->gd));
|
|
return FALSE;
|
|
}
|
|
continue;
|
|
}
|
|
# ifdef UNIX
|
|
else if (!rctl->before_image)
|
|
{ /* Replicated database with NOBEFORE_IMAGE journaling.
|
|
* ROLLBACK is allowed only if -FETCHRESYNC or -RESYNC is specified.
|
|
*/
|
|
if (!mur_options.fetchresync_port && !mur_options.resync_specified)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_RLBKNOBIMG, 2, DB_LEN_STR(rctl->gd));
|
|
return FALSE;
|
|
}
|
|
mur_options.rollback_losttnonly = TRUE;
|
|
/* Since we won't be touching the journal pool/file there is no question
|
|
* of leaving things in a corrupt state.
|
|
*/
|
|
replinst_file_corrupt = FALSE;
|
|
}
|
|
# endif
|
|
}
|
|
if (csd->freeze UNIX_ONLY(&& !jgbl.onlnrlbk))
|
|
{ /* region_freeze should release freeze here. For ONLINE ROLLBACK we would have
|
|
* waited for the freeze to be lifted off before */
|
|
reg_frz_status = region_freeze(rctl->gd, FALSE, TRUE, FALSE);
|
|
assert (0 == rctl->csa->hdr->freeze);
|
|
assert(REG_FREEZE_SUCCESS == reg_frz_status);
|
|
if (REG_ALREADY_FROZEN == reg_frz_status)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_DBFRZRESETFL, 2, DB_LEN_STR(rctl->gd));
|
|
return FALSE;
|
|
}
|
|
gtm_putmsg(VARLSTCNT(4) ERR_DBFRZRESETSUC, 2, DB_LEN_STR(rctl->gd));
|
|
}
|
|
/* save current jnl/repl state before changing in case recovery is interrupted */
|
|
csd->intrpt_recov_jnl_state = csd->jnl_state;
|
|
csd->intrpt_recov_repl_state = csd->repl_state;
|
|
csd->recov_interrupted = TRUE;
|
|
/* Temporarily change current state. mur_close_files() will restore them as appropriate */
|
|
if (mur_options.forward && JNL_ENABLED(csd))
|
|
csd->jnl_state = jnl_closed;
|
|
csd->repl_state = repl_closed;
|
|
csd->file_corrupt = TRUE;
|
|
/* flush the changed csd to disk */
|
|
fc = rctl->gd->dyn.addr->file_cntl;
|
|
fc->op = FC_WRITE;
|
|
fc->op_buff = (sm_uc_ptr_t)csd;
|
|
fc->op_len = (int)ROUND_UP(SIZEOF_FILE_HDR(csd), DISK_BLOCK_SIZE);
|
|
fc->op_pos = 1;
|
|
dbfilop(fc);
|
|
}
|
|
rctl->db_tn = csd->trans_hist.curr_tn;
|
|
/* Some routines use csa */
|
|
csa->jnl_state= csd->jnl_state;
|
|
csa->repl_state = csd->repl_state;
|
|
csa->jnl_before_image = csd->jnl_before_image;
|
|
} else
|
|
{ /* temporarily disable MUPIP STOP/signal handling. */
|
|
DEFER_INTERRUPTS(INTRPT_IN_MUR_OPEN_FILES);
|
|
|
|
/* NOTE: csa field is NULL, if we do not open database */
|
|
csd = rctl->csd = (sgmnt_data_ptr_t)malloc(SGMNT_HDR_LEN);
|
|
assert(0 == rctl->gd->dyn.addr->fname[rctl->gd->dyn.addr->fname_len]);
|
|
/* 1) show 2) extract 3) verify action does not need standalone access.
|
|
* In this case csa is NULL */
|
|
if (!file_head_read((char *)rctl->gd->dyn.addr->fname, rctl->csd, SGMNT_HDR_LEN))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(4) ERR_DBFILOPERR, 2, REG_LEN_STR(rctl->gd));
|
|
return FALSE;
|
|
}
|
|
rctl->jnl_state = csd->jnl_state;
|
|
rctl->repl_state = csd->repl_state;
|
|
rctl->before_image = csd->jnl_before_image;
|
|
rctl->initialized = TRUE;
|
|
ENABLE_INTERRUPTS(INTRPT_IN_MUR_OPEN_FILES); /* reenable the interrupts */
|
|
}
|
|
/* For star_specified we open journal files here.
|
|
* For star_specified we cannot do anything if journaling is disabled */
|
|
if (star_specified && JNL_ALLOWED(csd))
|
|
{
|
|
jctl = (jnl_ctl_list *)malloc(SIZEOF(jnl_ctl_list));
|
|
memset(jctl, 0, SIZEOF(jnl_ctl_list));
|
|
rctl->jctl_head = rctl->jctl = jctl;
|
|
jctl->jnl_fn_len = csd->jnl_file_len;
|
|
memcpy(jctl->jnl_fn, csd->jnl_file_name, csd->jnl_file_len);
|
|
jctl->jnl_fn[jctl->jnl_fn_len] = 0;
|
|
/* If system crashed during rename, following will fix it .
|
|
* Following function is directly related to cre_jnl_file_common */
|
|
cre_jnl_file_intrpt_rename(jctl->jnl_fn_len, jctl->jnl_fn);
|
|
if (!mur_fopen(jctl))
|
|
{
|
|
return FALSE;
|
|
}
|
|
if (SS_NORMAL != (jctl->status = mur_fread_eof(jctl, rctl)))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(9) ERR_JNLBADRECFMT, 3, jctl->jnl_fn_len, jctl->jnl_fn,
|
|
jctl->rec_offset, ERR_TEXT, 2, LEN_AND_LIT("mur_fread_eof failed"));
|
|
return FALSE;
|
|
}
|
|
assert((csa == rctl->csa) || !mur_options.update);
|
|
# ifdef UNIX
|
|
if (jgbl.onlnrlbk && jctl->jfh->crash
|
|
&& !csa->dbinit_shm_created && !jctl->jfh->recover_interrupted
|
|
&& !inst_requires_rlbk)
|
|
{ /* If the journal file is crashed, mur_fread_eof invokes mur_fread_eof_crash to read the
|
|
* last valid record from the journal file and marks the journal file as NOT properly
|
|
* closed. However, for online rollback, if the shared memory exists and the journal file
|
|
* crashed, we can still consider it as a no-crash scenario as long as the following
|
|
* conditions are met:
|
|
* 1. journal file is not created by a previously interrupted recovery
|
|
* 2. wcs_recover did NOT encounter a DBDANGER situation
|
|
*/
|
|
jctl->properly_closed = TRUE;
|
|
}
|
|
if (mur_options.verbose)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MUINFOSTR, 4, LEN_AND_LIT("Module : mur_open_files"),
|
|
LEN_AND_LIT("Post mur_fread_eof details"));
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MUINFOSTR, 4, LEN_AND_LIT(" Journal file"),
|
|
JNL_LEN_STR(rctl->csd));
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MUINFOUINT4, 4, LEN_AND_LIT(" Last valid record offset"),
|
|
jctl->lvrec_off, jctl->lvrec_off);
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MUINFOUINT4, 4, LEN_AND_LIT(" Last valid record time"),
|
|
jctl->lvrec_time, jctl->lvrec_time);
|
|
verbose_ptr = jctl->tail_analysis ? "TRUE" : "FALSE";
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MUINFOSTR, 4, LEN_AND_LIT(" Tail analysis done"),
|
|
LEN_AND_STR(verbose_ptr));
|
|
verbose_ptr = jctl->properly_closed ? "TRUE" : "FALSE";
|
|
gtm_putmsg(VARLSTCNT(6) ERR_MUINFOSTR, 4, LEN_AND_LIT(" Properly closed"),
|
|
LEN_AND_STR(verbose_ptr));
|
|
}
|
|
# endif
|
|
if (!is_file_identical((char *)jctl->jfh->data_file_name, (char *)rctl->gd->dyn.addr->fname))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(8) ERR_DBJNLNOTMATCH, 6, DB_LEN_STR(rctl->gd),
|
|
jctl->jnl_fn_len, jctl->jnl_fn,
|
|
jctl->jfh->data_file_name_length, jctl->jfh->data_file_name);
|
|
return FALSE;
|
|
}
|
|
}
|
|
} /* End rctl->db_present */
|
|
} /* End for */
|
|
UNIX_ONLY(
|
|
if (jgbl.mur_rollback)
|
|
jnlpool.repl_inst_filehdr->file_corrupt = replinst_file_corrupt;
|
|
)
|
|
/* At this point mur_ctl[] has been created from the current global directory database file names
|
|
* or from the journal file header's database names.
|
|
* For star_specified == TRUE implicitly only current generation journal files are specified and already opened
|
|
* For star_specified == FALSE user can specify multiple generations. We need to sort them */
|
|
if (!star_specified)
|
|
{
|
|
jnlno = 0;
|
|
cptr = jnl_file_list;
|
|
ctop = &jnl_file_list[jnl_file_list_len];
|
|
while (cptr < ctop)
|
|
{
|
|
jctl = (jnl_ctl_list *)malloc(SIZEOF(jnl_ctl_list));
|
|
memset(jctl, 0, SIZEOF(jnl_ctl_list));
|
|
cptr_last = cptr;
|
|
while (0 != *cptr && ',' != *cptr && '"' != *cptr && ' ' != *cptr)
|
|
++cptr;
|
|
if (!get_full_path(cptr_last, (unsigned int)(cptr - cptr_last),
|
|
(char *)jctl->jnl_fn, &jctl->jnl_fn_len, MAX_FN_LEN, &jctl->status2))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(5) ERR_FILEPARSE, 2, cptr_last, cptr - cptr_last, jctl->status2);
|
|
return FALSE;
|
|
}
|
|
cptr++; /* skip separator */
|
|
/* Note cre_jnl_file_intrpt_rename was already called in mur_db_files_from_jnllist */
|
|
if (!mur_fopen(jctl)) /* dont know rctl yet */
|
|
{
|
|
return FALSE;
|
|
}
|
|
for (rctl = mur_ctl, rctl_top = mur_ctl + murgbl.reg_full_total; rctl < rctl_top; rctl++)
|
|
{
|
|
if (rctl->gd->dyn.addr->fname_len == jctl->jfh->data_file_name_length &&
|
|
(0 == memcmp(jctl->jfh->data_file_name, rctl->gd->dyn.addr->fname,
|
|
rctl->gd->dyn.addr->fname_len)))
|
|
break;
|
|
}
|
|
if (rctl == rctl_top)
|
|
{
|
|
for (rl_ptr = mur_options.redirect; (NULL != rl_ptr); rl_ptr = rl_ptr->next)
|
|
{
|
|
if ((jctl->jfh->data_file_name_length == rl_ptr->org_name_len)
|
|
&& (0 == memcmp(jctl->jfh->data_file_name,
|
|
rl_ptr->org_name, rl_ptr->org_name_len)))
|
|
break;
|
|
}
|
|
if (NULL != rl_ptr)
|
|
{
|
|
for (rctl = mur_ctl, rctl_top = mur_ctl + murgbl.reg_full_total; rctl < rctl_top; rctl++)
|
|
{
|
|
if (rctl->gd->dyn.addr->fname_len == rl_ptr->new_name_len &&
|
|
(0 == memcmp(rctl->gd->dyn.addr->fname, rl_ptr->new_name,
|
|
rl_ptr->new_name_len)))
|
|
break;
|
|
}
|
|
}
|
|
if (rctl == rctl_top)
|
|
GTMASSERT;/* db list was created from journal file header. So it is not possible */
|
|
}
|
|
/* Detect and report 1st case of any duplicated files in mupip forward recovery command. */
|
|
if (mur_options.forward)
|
|
{
|
|
VMS_ONLY(set_gdid_from_file(&jctl->fid, (char *)jctl->jnl_fn, jctl->jnl_fn_len);)
|
|
# if defined(UNIX)
|
|
if (filename_to_id(&jctl->fid, (char *)jctl->jnl_fn))
|
|
{
|
|
# endif
|
|
for (temp_jctl = rctl->jctl_head; temp_jctl; temp_jctl = temp_jctl->next_gen)
|
|
{
|
|
if (UNIX_ONLY(is_gdid_identical(&jctl->fid, &temp_jctl->fid))
|
|
VMS_ONLY(is_gdid_gdid_identical(&jctl->fid, &temp_jctl->fid)))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(6) ERR_JNLFILEDUP, 4, jctl->jnl_fn_len,
|
|
jctl->jnl_fn, temp_jctl->jnl_fn_len, temp_jctl->jnl_fn);
|
|
return FALSE;
|
|
}
|
|
}
|
|
# if defined(UNIX)
|
|
}
|
|
else
|
|
{
|
|
gtm_putmsg(VARLSTCNT(11) ERR_JNLFILEOPNERR, 2, jctl->jnl_fn_len, jctl->jnl_fn,
|
|
ERR_SYSCALL, 5, LEN_AND_LIT("fstat"), CALLFROM, errno);
|
|
return FALSE;
|
|
}
|
|
# endif
|
|
}
|
|
if (SS_NORMAL != (jctl->status = mur_fread_eof(jctl, rctl)))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(5) ERR_JNLBADRECFMT, 3, jctl->jnl_fn_len, jctl->jnl_fn, jctl->rec_offset);
|
|
return FALSE;
|
|
}
|
|
/* Now, we have found the region for this jctl */
|
|
csd = rctl->csd;
|
|
if (!mur_options.forward)
|
|
{
|
|
rctl->jctl = rctl->jctl_head = jctl;
|
|
if (mur_options.update && !is_file_identical((char *)csd->jnl_file_name, (char *)jctl->jnl_fn))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(8) ERR_JNLNMBKNOTPRCD, 6, jctl->jnl_fn_len, jctl->jnl_fn,
|
|
JNL_LEN_STR(csd), DB_LEN_STR(rctl->gd));
|
|
return FALSE;
|
|
}
|
|
} else
|
|
{ /* rctl->jctl_head will have the lowest bov_tn of the journals of the region
|
|
* Then next_gen items will be non-decreasing order of bov_tn */
|
|
if (NULL == rctl->jctl_head)
|
|
{
|
|
assert(NULL == rctl->jctl);
|
|
rctl->jctl = rctl->jctl_head = jctl;
|
|
} else
|
|
{
|
|
temp_jctl = jctl;
|
|
jctl = rctl->jctl_head;
|
|
if (temp_jctl->jfh->bov_tn < jctl->jfh->bov_tn ||
|
|
(temp_jctl->jfh->bov_tn == jctl->jfh->bov_tn &&
|
|
temp_jctl->jfh->eov_tn < jctl->jfh->eov_tn))
|
|
{
|
|
assert(NULL == jctl->prev_gen);
|
|
temp_jctl->prev_gen = NULL;
|
|
temp_jctl->next_gen = jctl;
|
|
jctl->prev_gen = temp_jctl;
|
|
rctl->jctl_head = temp_jctl;
|
|
} else
|
|
{
|
|
while (NULL != jctl->next_gen &&
|
|
((jctl->next_gen->jfh->bov_tn < temp_jctl->jfh->bov_tn) ||
|
|
(jctl->next_gen->jfh->bov_tn == temp_jctl->jfh->bov_tn &&
|
|
jctl->next_gen->jfh->eov_tn < temp_jctl->jfh->eov_tn)))
|
|
jctl = jctl->next_gen ;
|
|
temp_jctl->next_gen = jctl->next_gen;
|
|
temp_jctl->prev_gen = jctl;
|
|
if (NULL != jctl->next_gen)
|
|
jctl->next_gen->prev_gen = temp_jctl;
|
|
jctl->next_gen = temp_jctl;
|
|
}
|
|
}
|
|
} /* mur_options.forward */
|
|
} /* for jnlno */
|
|
}
|
|
|
|
/* If not all regions of a global directory are processed, we shrink mur_ctl array and conserve space.
|
|
* It is specially needed for later code */
|
|
murgbl.reg_total = murgbl.reg_full_total;
|
|
for (regno = 0; regno < murgbl.reg_total; regno++)
|
|
{
|
|
if (NULL == mur_ctl[regno].jctl)
|
|
{
|
|
for (--murgbl.reg_total; murgbl.reg_total > regno; murgbl.reg_total--)
|
|
{
|
|
rctl = &mur_ctl[murgbl.reg_total];
|
|
if (NULL != (jctl = rctl->jctl_head))
|
|
{
|
|
assert(jctl == rctl->jctl); /* rctl->jctl and rctl->jctl_head should be same now */
|
|
tmp_rctl = mur_ctl[regno];
|
|
mur_ctl[regno] = *rctl;
|
|
*rctl = tmp_rctl;
|
|
rctl = &mur_ctl[regno];
|
|
MUR_FIX_JCTL_BACK_POINTER_TO_RCTL(jctl, rctl, &mur_ctl[murgbl.reg_total], TRUE);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
assert(murgbl.reg_full_total == max_reg_total);
|
|
if (!mur_options.rollback && murgbl.reg_total < murgbl.reg_full_total)
|
|
gtm_putmsg(VARLSTCNT (1) ERR_NOTALLJNLEN);
|
|
else if (mur_options.rollback && murgbl.reg_total < murgbl.reg_full_total)
|
|
gtm_putmsg(VARLSTCNT (1) ERR_NOTALLREPLON);
|
|
if (0 == murgbl.reg_total)
|
|
return FALSE;
|
|
/* From this point consider only regions with journals to be processed (murgbl.reg_total)
|
|
* However mur_close_files will close all regions opened (murgbl.reg_full_total) */
|
|
for (rctl = mur_ctl, rctl_top = mur_ctl + murgbl.reg_total; rctl < rctl_top; rctl++)
|
|
{
|
|
jctl = rctl->jctl_head;
|
|
if (mur_options.update)
|
|
{
|
|
csd = rctl->csd;
|
|
if (mur_options.chain && mur_options.forward)
|
|
{ /* User might have not specified journal file starting tn matching database curr_tn.
|
|
* So try to open previous generation journal files and add to linked list */
|
|
rctl->jctl = jctl; /* asserted by mur_insert_prev */
|
|
while (jctl->jfh->bov_tn > csd->trans_hist.curr_tn)
|
|
{
|
|
if (0 == jctl->jfh->prev_jnl_file_name_length)
|
|
{
|
|
gtm_putmsg(VARLSTCNT(11) ERR_JNLDBTNNOMATCH, 9,jctl->jnl_fn_len, jctl->jnl_fn,
|
|
LEN_AND_LIT("beginning"), &jctl->jfh->bov_tn,
|
|
DB_LEN_STR(rctl->gd), &csd->trans_hist.curr_tn, &csd->jnl_eovtn);
|
|
gtm_putmsg(VARLSTCNT(4) ERR_NOPREVLINK, 2,
|
|
jctl->jnl_fn_len, jctl->jnl_fn);
|
|
return FALSE;
|
|
} else if (!mur_insert_prev(&jctl))
|
|
return FALSE;
|
|
}
|
|
}
|
|
if (mur_options.forward)
|
|
{
|
|
if (!mur_options.notncheck && (jctl->jfh->bov_tn != csd->trans_hist.curr_tn))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(11) ERR_JNLDBTNNOMATCH, 9, jctl->jnl_fn_len, jctl->jnl_fn,
|
|
LEN_AND_LIT("beginning"), &jctl->jfh->bov_tn,
|
|
DB_LEN_STR(rctl->gd), &csd->trans_hist.curr_tn, &csd->jnl_eovtn);
|
|
return FALSE;
|
|
}
|
|
} else /* Backward Recovery */
|
|
{
|
|
if (jctl->jfh->eov_tn != csd->trans_hist.curr_tn)
|
|
{ /* 'outofsync' variable identifies situations in which backward recovery
|
|
* proceeds if inequality (csd->jnl_eovtn <= jfh->eov_tn <= csd->curr_tn) is TRUE.
|
|
* So if,
|
|
* i) backward recovery is interrupted at any time except at turn around point just after
|
|
* database header is synched OR
|
|
*ii) database is crashed but journaling is behind database i.e.
|
|
* jfh->eov_tn < csd->trans_hist.curr_tn
|
|
* outofsync is set to TRUE.
|
|
* backward recovery does not proceed if,
|
|
* i) database is crashed and journaling is ahead of database
|
|
* ii) database is cleanly terminated and outofsync is FALSE
|
|
*iii) outofsync is TRUE but above mentioned inequality is FALSE and
|
|
* interruption or crash did not occur while processing turn around point
|
|
*/
|
|
outofsync = (rctl->recov_interrupted ||
|
|
(jctl->jfh->crash && (jctl->jfh->eov_tn < csd->trans_hist.curr_tn)));
|
|
if ((jctl->jfh->crash && (jctl->jfh->eov_tn > csd->trans_hist.curr_tn) &&
|
|
!rctl->recov_interrupted) || (!jctl->jfh->crash && !outofsync) ||
|
|
(outofsync && !csd->turn_around_point && (csd->jnl_eovtn != csd->trans_hist.curr_tn)
|
|
&& (csd->jnl_eovtn > jctl->jfh->eov_tn)))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(11) ERR_JNLDBTNNOMATCH, 9, jctl->jnl_fn_len, jctl->jnl_fn,
|
|
LEN_AND_LIT("end"), &jctl->jfh->eov_tn, DB_LEN_STR(rctl->gd),
|
|
&csd->trans_hist.curr_tn, &csd->jnl_eovtn);
|
|
return FALSE;
|
|
}
|
|
}
|
|
}
|
|
} /* if mur_options.update */
|
|
if (mur_options.extr[GOOD_TN])
|
|
{
|
|
csa = rctl->csa;
|
|
if (NULL != csa)
|
|
{
|
|
# if (defined(DEBUG) && defined(VMS))
|
|
/* set wc_blocked as true to invoke wcs_recover */
|
|
GTM_WHITE_BOX_TEST(WBTEST_SET_WC_BLOCKED, csa->nl->wc_blocked, TRUE);
|
|
# endif
|
|
if (csa->nl->wc_blocked)
|
|
TREF(donot_write_inctn_in_wcs_recover) = TRUE;
|
|
}
|
|
}
|
|
while (NULL != jctl->next_gen) /* Check for continuity */
|
|
{
|
|
if (!mur_options.notncheck && (jctl->next_gen->jfh->bov_tn != jctl->jfh->eov_tn))
|
|
{
|
|
gtm_putmsg(VARLSTCNT(8) ERR_JNLTNOUTOFSEQ, 6,
|
|
&jctl->jfh->eov_tn, jctl->jnl_fn_len, jctl->jnl_fn,
|
|
&jctl->next_gen->jfh->bov_tn, jctl->next_gen->jnl_fn_len, jctl->next_gen->jnl_fn);
|
|
return FALSE;
|
|
}
|
|
jctl = jctl->next_gen;
|
|
}
|
|
rctl->jctl = jctl; /* latest in linked list */
|
|
} /* end for */
|
|
return TRUE;
|
|
}
|