<br />
<b>Warning</b>:  Undefined array key "global_protection_id" in <b>/home/wikitechy/public_html/interview-questions/wp-content/plugins/content-protector/inc/class-ps-rest-handler.php</b> on line <b>51</b><br />
{"id":579,"date":"2021-07-13T21:50:56","date_gmt":"2021-07-13T21:50:56","guid":{"rendered":"https:\/\/www.wikitechy.com\/interview-questions\/?p=579"},"modified":"2021-09-13T05:15:57","modified_gmt":"2021-09-13T05:15:57","slug":"what-is-best-practice-indexing-hdfs-data-into-solr-using-hive","status":"publish","type":"post","link":"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/","title":{"rendered":"What is best practice indexing hdfs data into solr using hive ?"},"content":{"rendered":"<div class=\"TextHeading\">\n<div class=\"hddn\">\n<h2 id=\"best-practice-indexing-hdfs-data-into-solr-using-hive\" class=\"color-green\" style=\"text-align: justify;\">Best practice indexing hdfs data into solr using hive<\/h2>\n<\/div>\n<\/div>\n<div><img fetchpriority=\"high\" decoding=\"async\" class=\"aligncenter size-medium\" src=\"https:\/\/cdn.wikitechy.com\/interview-questions\/hive\/partitionned-table-in-hive.png\" alt=\"partitionned table in hive\" width=\"602\" height=\"331\" \/><\/div>\n<div class=\"ImageContent\" style=\"text-align: justify;\">\n<div class=\"hddn\">Here,based on the requirement especially how typically your data gets updated, volume and architecture.<\/div>\n<\/div>\n<div class=\"Content\" style=\"text-align: justify;\">\n<div class=\"hddn\">\n<ul>\n<li>Run a MR job to index data using solrj.<\/li>\n<li>Create Lucene index using mr job and duplicate to the appropriate shards.<\/li>\n<li>Use Hbase indexer to populate Solr.<\/li>\n<\/ul>\n<\/div>\n<\/div>\n<div class=\"TextHeading\" style=\"text-align: justify;\">\n<div class=\"hddn\">\n<h2 id=\"properly-size-index\" class=\"color-green\">Properly Size Index:<\/h2>\n<\/div>\n<\/div>\n<div class=\"Content\">\n<div class=\"hddn\">\n<ul>\n<li style=\"text-align: justify;\">Understanding what to index typically requires deep business domain expertise on the data.<\/li>\n<li style=\"text-align: justify;\">This yields better indexing plan and increases accuracy for searching data.<\/li>\n<li style=\"text-align: justify;\">Not all data will be indexed but for an organization user have new data,Needs classification of all data untill it is understood what value it brings to the business.<\/li>\n<li style=\"text-align: justify;\">It implies is that data needs to be re-indexed so it is a good practice to store raw data somewhere low cost, often in HDFS or in the cloud object storage.<\/li>\n<\/ul>\n<\/div>\n<\/div>\n","protected":false},"excerpt":{"rendered":"<p>Answer : Here,based on the requirement especially how typically your data gets updated, volume and architecture.<\/p>\n","protected":false},"author":2,"featured_media":0,"comment_status":"open","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"passster_activate_protection":false,"passster_protect_child_pages":"","passster_protection_type":"password","passster_password":"","passster_activate_overwrite_defaults":"","passster_headline":"","passster_instruction":"","passster_placeholder":"","passster_button":"","passster_id":"","passster_activate_misc_settings":"","passster_redirect_url":"","passster_hide":"no","passster_area_shortcode":"","gtb_hide_title":false,"gtb_wrap_title":false,"gtb_class_title":"","gtb_remove_headerfooter":false,"footnotes":""},"categories":[3782],"tags":[195,971,3799,3904,3908,203,199,214,3909,3901,209,205,222,484,621,620,3905,196,3716,3907,712,970,366,477,208,288,483,3903,3902,3906,3900,976,975,200,974,197,280,364,968,216,2119,969],"class_list":["post-579","post","type-post","status-publish","format-standard","hentry","category-hive","tag-accenture-interview-questions-and-answers","tag-altimetrik-india-pvt-ltd-interview-questions-and-answers","tag-ani-technologies-pvt-ltd-interview-questions-and-answers","tag-apache-solr-analytics","tag-can-we-update-data-in-hadoop","tag-capgemini-interview-questions-and-answers","tag-casting-networks-india-pvt-limited-interview-questions-and-answers","tag-cgi-group-inc-interview-questions-and-answers","tag-change-data-capture-in-hive-example","tag-cloudera-solr-tutorial","tag-collabera-technologies-interview-questions-and-answers","tag-dell-international-services-india-pvt-ltd-interview-questions-and-answers","tag-flipkart-interview-questions-and-answers","tag-genpact-interview-questions-and-answers","tag-hive-query-based-interview-questions","tag-hive-scenario-based-interview-questions","tag-how-would-you-load-incremental-data-into-hive","tag-ibm-interview-questions-and-answers","tag-impetus-technologies-interview-questions-and-answers","tag-implementing-change-data-capture-using-hive","tag-indiabulls-technology-solutions-ltd-interview-questions-and-answers","tag-mindtree-interview-questions-and-answers","tag-netapp-interview-questions-and-answers","tag-pig-interview-questions","tag-prokarma-softech-pvt-ltd-interview-questions-and-answers","tag-r-systems-interview-questions-and-answers","tag-reliance-industries-ltd-interview-questions-and-answers","tag-solr-analytics-component","tag-solr-hadoop-example","tag-solr-hadoop-integration-example","tag-solr-index-hdfs-files","tag-synechron-te-interview-questions-and-answers","tag-tata-consultancy-service-interview-questions-and-answers","tag-tech-mahindra-interview-questions-and-answers","tag-trigent-software-interview-questions-and-answers","tag-unitedhealth-group-interview-questions-and-answers","tag-virtusa-consulting-services-pvt-ltd-interview-questions-and-answers","tag-wells-fargo-interview-questions-and-answers","tag-wipro-infotech-interview-questions-and-answers","tag-wipro-interview-questions-and-answers","tag-yash-technologies-interview-questions-and-answers","tag-yodlee-infotech-pvt-ltd-interview-questions-and-answers"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v22.6 - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>What is best practice indexing hdfs data into solr using hive ?<\/title>\n<meta name=\"description\" content=\"What is best practice indexing hdfs data into solr using hive - hive interview questions and answers - Run a MR job to index data using solr.\" \/>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/\" \/>\n<meta property=\"og:locale\" content=\"en_US\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"What is best practice indexing hdfs data into solr using hive ?\" \/>\n<meta property=\"og:description\" content=\"What is best practice indexing hdfs data into solr using hive - hive interview questions and answers - Run a MR job to index data using solr.\" \/>\n<meta property=\"og:url\" content=\"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/\" \/>\n<meta property=\"og:site_name\" content=\"Wikitechy\" \/>\n<meta property=\"article:published_time\" content=\"2021-07-13T21:50:56+00:00\" \/>\n<meta property=\"article:modified_time\" content=\"2021-09-13T05:15:57+00:00\" \/>\n<meta property=\"og:image\" content=\"https:\/\/cdn.wikitechy.com\/interview-questions\/hive\/partitionned-table-in-hive.png\" \/>\n<meta name=\"author\" content=\"Editor\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"Written by\" \/>\n\t<meta name=\"twitter:data1\" content=\"Editor\" \/>\n\t<meta name=\"twitter:label2\" content=\"Est. reading time\" \/>\n\t<meta name=\"twitter:data2\" content=\"1 minute\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"WebPage\",\"@id\":\"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/\",\"url\":\"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/\",\"name\":\"What is best practice indexing hdfs data into solr using hive ?\",\"isPartOf\":{\"@id\":\"https:\/\/www.wikitechy.com\/interview-questions\/#website\"},\"primaryImageOfPage\":{\"@id\":\"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/#primaryimage\"},\"image\":{\"@id\":\"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/#primaryimage\"},\"thumbnailUrl\":\"https:\/\/cdn.wikitechy.com\/interview-questions\/hive\/partitionned-table-in-hive.png\",\"datePublished\":\"2021-07-13T21:50:56+00:00\",\"dateModified\":\"2021-09-13T05:15:57+00:00\",\"author\":{\"@id\":\"https:\/\/www.wikitechy.com\/interview-questions\/#\/schema\/person\/4d5a581fb5470d1560324bddc5e8b757\"},\"description\":\"What is best practice indexing hdfs data into solr using hive - hive interview questions and answers - Run a MR job to index data using solr.\",\"inLanguage\":\"en-US\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/\"]}]},{\"@type\":\"ImageObject\",\"inLanguage\":\"en-US\",\"@id\":\"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/#primaryimage\",\"url\":\"https:\/\/cdn.wikitechy.com\/interview-questions\/hive\/partitionned-table-in-hive.png\",\"contentUrl\":\"https:\/\/cdn.wikitechy.com\/interview-questions\/hive\/partitionned-table-in-hive.png\"},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/www.wikitechy.com\/interview-questions\/#website\",\"url\":\"https:\/\/www.wikitechy.com\/interview-questions\/\",\"name\":\"Wikitechy\",\"description\":\"Interview Questions\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/www.wikitechy.com\/interview-questions\/?s={search_term_string}\"},\"query-input\":\"required name=search_term_string\"}],\"inLanguage\":\"en-US\"},{\"@type\":\"Person\",\"@id\":\"https:\/\/www.wikitechy.com\/interview-questions\/#\/schema\/person\/4d5a581fb5470d1560324bddc5e8b757\",\"name\":\"Editor\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"en-US\",\"@id\":\"https:\/\/www.wikitechy.com\/interview-questions\/#\/schema\/person\/image\/\",\"url\":\"https:\/\/secure.gravatar.com\/avatar\/e9531079fe7e07841b7b156c04d65e5f39d4adfd18b6ffe3edfff8ca5aab85b5?s=96&d=mm&r=g\",\"contentUrl\":\"https:\/\/secure.gravatar.com\/avatar\/e9531079fe7e07841b7b156c04d65e5f39d4adfd18b6ffe3edfff8ca5aab85b5?s=96&d=mm&r=g\",\"caption\":\"Editor\"},\"url\":\"https:\/\/www.wikitechy.com\/interview-questions\/author\/editor\/\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. -->","yoast_head_json":{"title":"What is best practice indexing hdfs data into solr using hive ?","description":"What is best practice indexing hdfs data into solr using hive - hive interview questions and answers - Run a MR job to index data using solr.","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/","og_locale":"en_US","og_type":"article","og_title":"What is best practice indexing hdfs data into solr using hive ?","og_description":"What is best practice indexing hdfs data into solr using hive - hive interview questions and answers - Run a MR job to index data using solr.","og_url":"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/","og_site_name":"Wikitechy","article_published_time":"2021-07-13T21:50:56+00:00","article_modified_time":"2021-09-13T05:15:57+00:00","og_image":[{"url":"https:\/\/cdn.wikitechy.com\/interview-questions\/hive\/partitionned-table-in-hive.png"}],"author":"Editor","twitter_card":"summary_large_image","twitter_misc":{"Written by":"Editor","Est. reading time":"1 minute"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"WebPage","@id":"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/","url":"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/","name":"What is best practice indexing hdfs data into solr using hive ?","isPartOf":{"@id":"https:\/\/www.wikitechy.com\/interview-questions\/#website"},"primaryImageOfPage":{"@id":"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/#primaryimage"},"image":{"@id":"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/#primaryimage"},"thumbnailUrl":"https:\/\/cdn.wikitechy.com\/interview-questions\/hive\/partitionned-table-in-hive.png","datePublished":"2021-07-13T21:50:56+00:00","dateModified":"2021-09-13T05:15:57+00:00","author":{"@id":"https:\/\/www.wikitechy.com\/interview-questions\/#\/schema\/person\/4d5a581fb5470d1560324bddc5e8b757"},"description":"What is best practice indexing hdfs data into solr using hive - hive interview questions and answers - Run a MR job to index data using solr.","inLanguage":"en-US","potentialAction":[{"@type":"ReadAction","target":["https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/"]}]},{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/www.wikitechy.com\/interview-questions\/hive\/what-is-best-practice-indexing-hdfs-data-into-solr-using-hive\/#primaryimage","url":"https:\/\/cdn.wikitechy.com\/interview-questions\/hive\/partitionned-table-in-hive.png","contentUrl":"https:\/\/cdn.wikitechy.com\/interview-questions\/hive\/partitionned-table-in-hive.png"},{"@type":"WebSite","@id":"https:\/\/www.wikitechy.com\/interview-questions\/#website","url":"https:\/\/www.wikitechy.com\/interview-questions\/","name":"Wikitechy","description":"Interview Questions","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/www.wikitechy.com\/interview-questions\/?s={search_term_string}"},"query-input":"required name=search_term_string"}],"inLanguage":"en-US"},{"@type":"Person","@id":"https:\/\/www.wikitechy.com\/interview-questions\/#\/schema\/person\/4d5a581fb5470d1560324bddc5e8b757","name":"Editor","image":{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/www.wikitechy.com\/interview-questions\/#\/schema\/person\/image\/","url":"https:\/\/secure.gravatar.com\/avatar\/e9531079fe7e07841b7b156c04d65e5f39d4adfd18b6ffe3edfff8ca5aab85b5?s=96&d=mm&r=g","contentUrl":"https:\/\/secure.gravatar.com\/avatar\/e9531079fe7e07841b7b156c04d65e5f39d4adfd18b6ffe3edfff8ca5aab85b5?s=96&d=mm&r=g","caption":"Editor"},"url":"https:\/\/www.wikitechy.com\/interview-questions\/author\/editor\/"}]}},"_links":{"self":[{"href":"https:\/\/www.wikitechy.com\/interview-questions\/wp-json\/wp\/v2\/posts\/579","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.wikitechy.com\/interview-questions\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.wikitechy.com\/interview-questions\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.wikitechy.com\/interview-questions\/wp-json\/wp\/v2\/users\/2"}],"replies":[{"embeddable":true,"href":"https:\/\/www.wikitechy.com\/interview-questions\/wp-json\/wp\/v2\/comments?post=579"}],"version-history":[{"count":3,"href":"https:\/\/www.wikitechy.com\/interview-questions\/wp-json\/wp\/v2\/posts\/579\/revisions"}],"predecessor-version":[{"id":3456,"href":"https:\/\/www.wikitechy.com\/interview-questions\/wp-json\/wp\/v2\/posts\/579\/revisions\/3456"}],"wp:attachment":[{"href":"https:\/\/www.wikitechy.com\/interview-questions\/wp-json\/wp\/v2\/media?parent=579"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.wikitechy.com\/interview-questions\/wp-json\/wp\/v2\/categories?post=579"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.wikitechy.com\/interview-questions\/wp-json\/wp\/v2\/tags?post=579"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}