#!/usr/bin/env python
#
# Public Domain 2014-present MongoDB, Inc.
# Public Domain 2008-2014 WiredTiger, Inc.
#
# This is free and unencumbered software released into the public domain.
#
# Anyone is free to copy, modify, publish, use, compile, sell, or
# distribute this software, either in source code form or as a compiled
# binary, for any purpose, commercial or non-commercial, and by any
# means.
#
# In jurisdictions that recognize copyright laws, the author or authors
# of this software dedicate any and all copyright interest in the
# software to the public domain. We make this dedication for the benefit
# of the public at large and to the detriment of our heirs and
# successors. We intend this dedication to be an overt act of
# relinquishment in perpetuity of all present and future rights to this
# software under copyright law.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
# IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR
# OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
# ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
# OTHER DEALINGS IN THE SOFTWARE.
#
# test_timestamp07.py
#   Timestamps: checkpoints.
#

from helper import copy_wiredtiger_home
import random
from suite_subprocess import suite_subprocess
import wiredtiger, wttest
from wtscenario import make_scenarios

def timestamp_str(t):
    return '%x' % t

class test_timestamp07(wttest.WiredTigerTestCase, suite_subprocess):
    tablename = 'ts07_ts_nologged'
    tablename2 = 'ts07_nots_logged'
    tablename3 = 'ts07_ts_logged'

    types = [
        ('file', dict(uri='file:', use_cg=False, use_index=False)),
        ('table-cg', dict(uri='table:', use_cg=True, use_index=False)),
    ]
    conncfg = [
        ('nolog', dict(conn_config='create,cache_size=2M', using_log=False)),
        ('log', dict(conn_config='create,log=(file_max=1M,archive=false,enabled),cache_size=2M',
            using_log=True)),
    ]
    session_config = 'isolation=snapshot'
    nkeys = [
        ('100keys', dict(nkeys=100)),
        ('500keys', dict(nkeys=500)),
        ('1000keys', dict(nkeys=1000)),
    ]
    scenarios = make_scenarios(types, conncfg, nkeys)
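
    # make_scenarios() generates the cross product of the lists above, so each
    # scenario pairs one storage type with one logging configuration and one
    # key count (2 x 2 x 3 = 12 scenarios in total). timestamp_str() formats an
    # integer timestamp as the hexadecimal string form that WiredTiger's
    # timestamp configuration strings expect.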
    # Binary values.
    value = u'\u0001\u0002abcd\u0007\u0004'
    value2 = u'\u0001\u0002dcba\u0007\u0004'
    value3 = u'\u0001\u0002cdef\u0007\u0004'

    # Check that a cursor (optionally started in a new transaction) sees the
    # expected value for a key.
    def check(self, session, txn_config, k, expected):
        if txn_config:
            session.begin_transaction(txn_config)
        c = session.open_cursor(self.uri + self.tablename, None)
        if not expected:
            c.set_key(k)
            self.assertEqual(c.search(), wiredtiger.WT_NOTFOUND)
        else:
            self.assertEqual(c[k], expected)
        c.close()
        if txn_config:
            session.commit_transaction()

    # Check reads of all tables at a timestamp.
    def check_reads(self, session, txn_config, check_value, valcnt, valcnt2, valcnt3):
        if txn_config:
            session.begin_transaction(txn_config)
        c = session.open_cursor(self.uri + self.tablename, None)
        c2 = session.open_cursor(self.uri + self.tablename2, None)
        c3 = session.open_cursor(self.uri + self.tablename3, None)
        count = 0
        for k, v in c:
            if check_value in str(v):
                count += 1
        c.close()
        count2 = 0
        for k, v in c2:
            if check_value in str(v):
                count2 += 1
        c2.close()
        count3 = 0
        for k, v in c3:
            if check_value in str(v):
                count3 += 1
        c3.close()
        if txn_config:
            session.commit_transaction()
        self.assertEqual(count, valcnt)
        self.assertEqual(count2, valcnt2)
        self.assertEqual(count3, valcnt3)

    #
    # Take a backup of the database and verify that the value we want to
    # check exists in the tables the expected number of times.
    #
    def backup_check(self, check_value, valcnt, valcnt2, valcnt3):
        newdir = "BACKUP"
        copy_wiredtiger_home(self, '.', newdir, True)
        conn = self.setUpConnectionOpen(newdir)
        session = self.setUpSessionOpen(conn)
        c = session.open_cursor(self.uri + self.tablename, None)
        c2 = session.open_cursor(self.uri + self.tablename2, None)
        c3 = session.open_cursor(self.uri + self.tablename3, None)
        # Count how many times the check value is present.
        count = 0
        for k, v in c:
            if check_value in str(v):
                # print "check_value found in key " + str(k)
                count += 1
        c.close()
        # Count how many times the check value is present in the
        # non-timestamp table.
        count2 = 0
        for k, v in c2:
            if check_value in str(v):
                # print "check_value found in key " + str(k)
                count2 += 1
        c2.close()
        # Count how many times the check value is present in the
        # logged timestamp table.
        count3 = 0
        for k, v in c3:
            if check_value in str(v):
                count3 += 1
        c3.close()
        conn.close()
        # print "CHECK BACKUP: Count " + str(count) + " Count2 " + str(count2) + " Count3 " + str(count3)
        # print "CHECK BACKUP: Expect value2 count " + str(valcnt)
        # print "CHECK BACKUP: 2nd table Expect value2 count " + str(valcnt2)
        # print "CHECK BACKUP: 3rd table Expect value2 count " + str(valcnt3)
        self.assertEqual(count, valcnt)
        self.assertEqual(count2, valcnt2)
        self.assertEqual(count3, valcnt3)

    # Check that a backup of the database sees the expected values after a
    # checkpoint.
    def ckpt_backup(self, check_value, valcnt, valcnt2, valcnt3):
        # Take a checkpoint. Make a copy of the database. Open the
        # copy and verify whether or not the expected data is in there.
        ckptcfg = 'use_timestamp=true'
        self.session.checkpoint(ckptcfg)
        self.backup_check(check_value, valcnt, valcnt2, valcnt3)
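
    # check_stable() verifies the expected counts two ways: in a backup taken
    # after a timestamped checkpoint, and with live reads at the current
    # stable timestamp.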
    def check_stable(self, check_value, valcnt, valcnt2, valcnt3):
        self.ckpt_backup(check_value, valcnt, valcnt2, valcnt3)
        # When reading as-of a timestamp, tables 1 and 3 should match (both
        # use timestamps and we're not running recovery, so logging behavior
        # should be irrelevant).
        self.check_reads(self.session, 'read_timestamp=' + self.stablets,
            check_value, valcnt, valcnt2, valcnt)

    def test_timestamp07(self):
        uri = self.uri + self.tablename
        uri2 = self.uri + self.tablename2
        uri3 = self.uri + self.tablename3
        #
        # Open three tables:
        # 1. Table is not logged and uses timestamps.
        # 2. Table is logged and does not use timestamps.
        # 3. Table is logged and uses timestamps.
        #
        self.session.create(uri, 'key_format=i,value_format=S,log=(enabled=false)')
        c = self.session.open_cursor(uri)
        self.session.create(uri2, 'key_format=i,value_format=S')
        c2 = self.session.open_cursor(uri2)
        self.session.create(uri3, 'key_format=i,value_format=S')
        c3 = self.session.open_cursor(uri3)
        # print "tables created"

        # Insert keys 1..nkeys each with timestamp=key, in some order.
        orig_keys = list(range(1, self.nkeys+1))
        keys = orig_keys[:]
        random.shuffle(keys)

        for k in keys:
            c2[k] = self.value
            self.session.begin_transaction()
            c[k] = self.value
            c3[k] = self.value
            self.session.commit_transaction('commit_timestamp=' + timestamp_str(k))

        # print "value inserted in all tables, reading..."

        # Now check that we see the expected state when reading at each
        # timestamp.
        for k in orig_keys:
            self.check(self.session, 'read_timestamp=' + timestamp_str(k),
                k, self.value)
            self.check(self.session, 'read_timestamp=' + timestamp_str(k),
                k + 1, None)

        # print "all values read, updating timestamps"

        # Bump the oldest timestamp; we're not going back.
        self.assertTimestampsEqual(self.conn.query_timestamp(),
            timestamp_str(self.nkeys))
        self.oldts = self.stablets = timestamp_str(self.nkeys)
        self.conn.set_timestamp('oldest_timestamp=' + self.oldts)
        self.conn.set_timestamp('stable_timestamp=' + self.stablets)
        # print "Oldest " + self.oldts
        # print "inserting value2 in all tables"

        # Update them and retry.
        random.shuffle(keys)
        count = 0
        for k in keys:
            # Make sure a timestamp cursor is the last one to update. This
            # tests the scenario for a bug we found where recovery replayed
            # the last record written into the log.
            #
            # print "Key " + str(k) + " to value2"
            c2[k] = self.value2
            self.session.begin_transaction()
            c[k] = self.value2
            c3[k] = self.value2
            ts = timestamp_str(k + self.nkeys)
            self.session.commit_transaction('commit_timestamp=' + ts)
            # print "Commit key " + str(k) + " ts " + ts
            count += 1
        # print "Updated " + str(count) + " keys to value2"

        # Take a checkpoint using the given configuration. Then verify
        # whether value2 appears in a copy of that data or not.
        # print "check_stable 1"
        self.check_stable(self.value2, 0, self.nkeys,
            self.nkeys if self.using_log else 0)

        # Update the stable timestamp to the latest, but not the oldest
        # timestamp, and make sure we can see the data. Once the stable
        # timestamp is moved we should see all keys with value2.
        self.stablets = timestamp_str(self.nkeys*2)
        self.conn.set_timestamp('stable_timestamp=' + self.stablets)
        # print "check_stable 2"
        self.check_stable(self.value2, self.nkeys, self.nkeys, self.nkeys)

        # If we're not using the log, we're done.
        if not self.using_log:
            return
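
        # The remainder of the test exercises log recovery: the next backup is
        # taken after a log flush with no checkpoint, so the counts checked
        # below depend on recovery replaying the log when the backup copy is
        # opened.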
# # print "Key " + str(k) + " to value3" c2[k] = self.value3 self.session.begin_transaction() c[k] = self.value3 c3[k] = self.value3 ts = timestamp_str(k + self.nkeys*2) self.session.commit_transaction('commit_timestamp=' + ts) # print "Commit key " + str(k) + " ts " + ts count += 1 # print "Updated " + str(count) + " keys to value3" # Flush the log but don't checkpoint self.session.log_flush('sync=on') # Take a backup and then verify whether value3 appears in a copy # of that data or not. Both tables that are logged should see # all the data regardless of timestamps. The table that is not # logged should not see any of it. # print "check_stable 3" self.check_stable(self.value3, 0, self.nkeys, self.nkeys) if __name__ == '__main__': wttest.run()