8f56f2711b5b1653f60d009d6f642cb653c20462,perfkitbenchmarker/benchmarks/cloudsuite_web_search.py,,_BuildIndex,#Any#Any#,80

Before Change


  Downloads data and builds Solr index from it.
  indexer.Install("nutch")
  hadoop_tmp_dir = posixpath.join(indexer.GetScratchDir(), "hadoop_tmp")
  indexer.RemoteCommand("cd {0} && "
                        "wget {1} && "
                        "mkdir -p {4} && "
                        "sed -i "/<value>http/c\\<value>http://{2}:"
                        "{3}/solr/cloudsuite_web_search</value>" "
                        "nutch-site.xml && "
                        "sed -i "s/HADOOP_TMP_DIR/{4}/g" nutch-site.xml".format(
                            CLOUDSUITE_WEB_SEARCH_DIR,
                            NUTCH_SITE_URL, solr_node.ip_address,
                            SOLR_PORT, re.escape(hadoop_tmp_dir)))
  stdout, _ = indexer.RemoteCommand("cd {0} && "
                                    "cat nutch-site.xml".format(
                                        CLOUDSUITE_WEB_SEARCH_DIR))
  nutch.ConfigureNutchSite(indexer, stdout.replace(""", "\\""))
  scratch_dir = indexer.GetScratchDir()
  indexer.RobustRemoteCommand("cd {0} && "
                              "wget {1}  && "

After Change


                     "tar zxvf index -C {2}".format(
                         solr_core_dir, INDEX_URL, "cloudsuite_web_search*"))

  vm_util.RunThreaded(DownloadIndex, solr_nodes, len(solr_nodes))
  server_heap_size = FLAGS.server_heap_size
  for vm in solr_nodes:
    if vm == solr_nodes[0]:
      solr.StartWithZookeeper(vm, fw, SOLR_PORT, server_heap_size, False)
In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 3

Instances


Project Name: GoogleCloudPlatform/PerfKitBenchmarker
Commit Name: 8f56f2711b5b1653f60d009d6f642cb653c20462
Time: 2015-09-11
Author: vukasin.stefanovic92@gmail.com
File Name: perfkitbenchmarker/benchmarks/cloudsuite_web_search.py
Class Name:
Method Name: _BuildIndex


Project Name: GoogleCloudPlatform/PerfKitBenchmarker
Commit Name: 2713875d877199782b0ced85148fc488481f1ede
Time: 2015-11-25
Author: connormccoy@google.com
File Name: perfkitbenchmarker/linux_benchmarks/mongodb_ycsb_benchmark.py
Class Name:
Method Name: Cleanup


Project Name: GoogleCloudPlatform/PerfKitBenchmarker
Commit Name: 6e9565285f181f4737ba19f504d076b96dd7eb39
Time: 2015-11-25
Author: connormccoy@google.com
File Name: perfkitbenchmarker/linux_benchmarks/aerospike_benchmark.py
Class Name:
Method Name: Cleanup


Project Name: GoogleCloudPlatform/PerfKitBenchmarker
Commit Name: 8f56f2711b5b1653f60d009d6f642cb653c20462
Time: 2015-09-11
Author: vukasin.stefanovic92@gmail.com
File Name: perfkitbenchmarker/benchmarks/cloudsuite_web_search.py
Class Name:
Method Name: _BuildIndex