# create_bwc_index_with_some_ancient_segments.py (4.3 KB)

  1. import create_bwc_index
  2. import logging
  3. import os
  4. import random
  5. import shutil
  6. import subprocess
  7. import sys
  8. import tempfile
  9. def fetch_version(version):
  10. logging.info('fetching ES version %s' % version)
  11. if subprocess.call([sys.executable, os.path.join(os.path.split(sys.argv[0])[0], 'get-bwc-version.py'), version]) != 0:
  12. raise RuntimeError('failed to download ES version %s' % version)
  13. def main():
  14. '''
  15. Creates a static back compat index (.zip) with mixed 0.20 (Lucene 3.x) and 0.90 (Lucene 4.x) segments.
  16. '''
  17. logging.basicConfig(format='[%(levelname)s] [%(asctime)s] %(message)s', level=logging.INFO,
  18. datefmt='%Y-%m-%d %I:%M:%S %p')
  19. logging.getLogger('elasticsearch').setLevel(logging.ERROR)
  20. logging.getLogger('urllib3').setLevel(logging.WARN)
  21. tmp_dir = tempfile.mkdtemp()
  22. try:
  23. data_dir = os.path.join(tmp_dir, 'data')
  24. repo_dir = os.path.join(tmp_dir, 'repo')
  25. logging.info('Temp data dir: %s' % data_dir)
  26. logging.info('Temp repo dir: %s' % repo_dir)
  27. first_version = '0.20.6'
  28. second_version = '0.90.6'
  29. index_name = 'index-%s-and-%s' % (first_version, second_version)
  30. # Download old ES releases if necessary:
  31. release_dir = os.path.join('backwards', 'elasticsearch-%s' % first_version)
  32. if not os.path.exists(release_dir):
  33. fetch_version(first_version)
  34. node = create_bwc_index.start_node(first_version, release_dir, data_dir, repo_dir, cluster_name=index_name)
  35. client = create_bwc_index.create_client()
  36. # Creates the index & indexes docs w/ first_version:
  37. create_bwc_index.generate_index(client, first_version, index_name)
  38. # Make sure we write segments:
  39. flush_result = client.indices.flush(index=index_name)
  40. if not flush_result['ok']:
  41. raise RuntimeError('flush failed: %s' % str(flush_result))
  42. segs = client.indices.segments(index=index_name)
  43. shards = segs['indices'][index_name]['shards']
  44. if len(shards) != 1:
  45. raise RuntimeError('index should have 1 shard but got %s' % len(shards))
  46. first_version_segs = shards['0'][0]['segments'].keys()
  47. create_bwc_index.shutdown_node(node)
  48. print('%s server output:\n%s' % (first_version, node.stdout.read().decode('utf-8')))
  49. node = None
  50. release_dir = os.path.join('backwards', 'elasticsearch-%s' % second_version)
  51. if not os.path.exists(release_dir):
  52. fetch_version(second_version)
  53. # Now also index docs with second_version:
  54. node = create_bwc_index.start_node(second_version, release_dir, data_dir, repo_dir, cluster_name=index_name)
  55. client = create_bwc_index.create_client()
  56. # If we index too many docs, the random refresh/flush causes the ancient segments to be merged away:
  57. num_docs = 10
  58. create_bwc_index.index_documents(client, index_name, 'doc', num_docs)
  59. # Make sure we get a segment:
  60. flush_result = client.indices.flush(index=index_name)
  61. if not flush_result['ok']:
  62. raise RuntimeError('flush failed: %s' % str(flush_result))
  63. # Make sure we see mixed segments (it's possible Lucene could have "accidentally" merged away the first_version segments):
  64. segs = client.indices.segments(index=index_name)
  65. shards = segs['indices'][index_name]['shards']
  66. if len(shards) != 1:
  67. raise RuntimeError('index should have 1 shard but got %s' % len(shards))
  68. second_version_segs = shards['0'][0]['segments'].keys()
  69. #print("first: %s" % first_version_segs)
  70. #print("second: %s" % second_version_segs)
  71. for segment_name in first_version_segs:
  72. if segment_name in second_version_segs:
  73. # Good: an ancient version seg "survived":
  74. break
  75. else:
  76. raise RuntimeError('index has no first_version segs left')
  77. for segment_name in second_version_segs:
  78. if segment_name not in first_version_segs:
  79. # Good: a second_version segment was written
  80. break
  81. else:
  82. raise RuntimeError('index has no second_version segs left')
  83. create_bwc_index.shutdown_node(node)
  84. print('%s server output:\n%s' % (second_version, node.stdout.read().decode('utf-8')))
  85. node = None
  86. create_bwc_index.compress_index('%s-and-%s' % (first_version, second_version), tmp_dir, 'core/src/test/resources/org/elasticsearch/action/admin/indices/upgrade')
  87. finally:
  88. if node is not None:
  89. create_bwc_index.shutdown_node(node)
  90. shutil.rmtree(tmp_dir)
  91. if __name__ == '__main__':
  92. main()