create_bwc_index_with_some_ancient_segments.py 4.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113
  1. import create_bwc_index
  2. import logging
  3. import os
  4. import random
  5. import shutil
  6. import subprocess
  7. import sys
  8. import tempfile
  9. def fetch_version(version):
  10. logging.info('fetching ES version %s' % version)
  11. if subprocess.call([sys.executable, os.path.join(os.path.split(sys.argv[0])[0], 'get-bwc-version.py'), version]) != 0:
  12. raise RuntimeError('failed to download ES version %s' % version)
  13. def main():
  14. '''
  15. Creates a static back compat index (.zip) with mixed 0.20 (Lucene 3.x) and 0.90 (Lucene 4.x) segments.
  16. '''
  17. logging.basicConfig(format='[%(levelname)s] [%(asctime)s] %(message)s', level=logging.INFO,
  18. datefmt='%Y-%m-%d %I:%M:%S %p')
  19. logging.getLogger('elasticsearch').setLevel(logging.ERROR)
  20. logging.getLogger('urllib3').setLevel(logging.WARN)
  21. tmp_dir = tempfile.mkdtemp()
  22. try:
  23. data_dir = os.path.join(tmp_dir, 'data')
  24. logging.info('Temp data dir: %s' % data_dir)
  25. first_version = '0.20.6'
  26. second_version = '0.90.6'
  27. index_name = 'index-%s-and-%s' % (first_version, second_version)
  28. # Download old ES releases if necessary:
  29. release_dir = os.path.join('backwards', 'elasticsearch-%s' % first_version)
  30. if not os.path.exists(release_dir):
  31. fetch_version(first_version)
  32. node = create_bwc_index.start_node(first_version, release_dir, data_dir, cluster_name=index_name)
  33. client = create_bwc_index.create_client()
  34. # Creates the index & indexes docs w/ first_version:
  35. create_bwc_index.generate_index(client, first_version, index_name)
  36. # Make sure we write segments:
  37. flush_result = client.indices.flush(index=index_name)
  38. if not flush_result['ok']:
  39. raise RuntimeError('flush failed: %s' % str(flush_result))
  40. segs = client.indices.segments(index=index_name)
  41. shards = segs['indices'][index_name]['shards']
  42. if len(shards) != 1:
  43. raise RuntimeError('index should have 1 shard but got %s' % len(shards))
  44. first_version_segs = shards['0'][0]['segments'].keys()
  45. create_bwc_index.shutdown_node(node)
  46. print('%s server output:\n%s' % (first_version, node.stdout.read().decode('utf-8')))
  47. node = None
  48. release_dir = os.path.join('backwards', 'elasticsearch-%s' % second_version)
  49. if not os.path.exists(release_dir):
  50. fetch_version(second_version)
  51. # Now also index docs with second_version:
  52. node = create_bwc_index.start_node(second_version, release_dir, data_dir, cluster_name=index_name)
  53. client = create_bwc_index.create_client()
  54. # If we index too many docs, the random refresh/flush causes the ancient segments to be merged away:
  55. num_docs = 10
  56. create_bwc_index.index_documents(client, index_name, 'doc', num_docs)
  57. # Make sure we get a segment:
  58. flush_result = client.indices.flush(index=index_name)
  59. if not flush_result['ok']:
  60. raise RuntimeError('flush failed: %s' % str(flush_result))
  61. # Make sure we see mixed segments (it's possible Lucene could have "accidentally" merged away the first_version segments):
  62. segs = client.indices.segments(index=index_name)
  63. shards = segs['indices'][index_name]['shards']
  64. if len(shards) != 1:
  65. raise RuntimeError('index should have 1 shard but got %s' % len(shards))
  66. second_version_segs = shards['0'][0]['segments'].keys()
  67. #print("first: %s" % first_version_segs)
  68. #print("second: %s" % second_version_segs)
  69. for segment_name in first_version_segs:
  70. if segment_name in second_version_segs:
  71. # Good: an ancient version seg "survived":
  72. break
  73. else:
  74. raise RuntimeError('index has no first_version segs left')
  75. for segment_name in second_version_segs:
  76. if segment_name not in first_version_segs:
  77. # Good: a second_version segment was written
  78. break
  79. else:
  80. raise RuntimeError('index has no second_version segs left')
  81. create_bwc_index.shutdown_node(node)
  82. print('%s server output:\n%s' % (second_version, node.stdout.read().decode('utf-8')))
  83. node = None
  84. create_bwc_index.compress_index('%s-and-%s' % (first_version, second_version), tmp_dir, 'src/test/resources/org/elasticsearch/rest/action/admin/indices/upgrade')
  85. finally:
  86. if node is not None:
  87. create_bwc_index.shutdown_node(node)
  88. shutil.rmtree(tmp_dir)
  89. if __name__ == '__main__':
  90. main()