

{"id":2559,"date":"2017-05-08T13:12:42","date_gmt":"2017-05-08T13:12:42","guid":{"rendered":"http:\/\/data-flair.training\/blogs\/?p=2559"},"modified":"2019-05-10T17:00:29","modified_gmt":"2019-05-10T11:30:29","slug":"how-hadoop-mapreduce-works","status":"publish","type":"post","link":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/","title":{"rendered":"How Hadoop MapReduce Works &#8211; MapReduce Tutorial"},"content":{"rendered":"<div class='__iawmlf-post-loop-links' style='display:none;' data-iawmlf-post-links='[{&quot;id&quot;:2355,&quot;href&quot;:&quot;https:\\\/\\\/techvidvan.com\\\/tutorials\\\/hadoop-partitioner-introduction&quot;,&quot;archived_href&quot;:&quot;http:\\\/\\\/web-wp.archive.org\\\/web\\\/20250213040210\\\/https:\\\/\\\/techvidvan.com\\\/tutorials\\\/hadoop-partitioner-introduction\\\/&quot;,&quot;redirect_href&quot;:&quot;&quot;,&quot;checks&quot;:[{&quot;date&quot;:&quot;2025-12-11 04:17:39&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2025-12-14 09:45:53&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2025-12-19 00:34:28&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2025-12-23 08:34:07&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2025-12-26 13:04:53&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2025-12-30 00:07:48&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-01-02 17:54:47&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-01-07 03:21:22&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-01-10 17:49:41&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-01-14 18:49:26&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-01-18 15:24:09&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-01-24 11:44:59&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-01-28 08:23:44&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-01-31 
09:13:29&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-02-03 23:18:27&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-02-07 15:35:40&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-02-12 05:56:10&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-02-15 06:48:52&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-02-18 10:01:24&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-02-21 17:33:19&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-02-25 06:21:46&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-03-01 06:21:48&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-03-04 11:32:45&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-03-07 16:50:43&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-03-10 17:18:46&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-03-14 10:57:02&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-03-18 14:30:57&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-03-22 12:28:03&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-03-26 05:04:11&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-03-30 07:40:54&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-04-04 12:00:59&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-04-07 13:33:42&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-04-10 15:34:06&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-04-14 16:37:45&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-04-19 22:20:25&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-04-23 10:37:28&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-04-27 03:01:08&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-04-30 04:40:33&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-05-04 
08:33:41&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-05-10 16:54:34&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-05-15 13:23:53&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-05-19 14:33:04&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-05-23 10:14:54&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-05-26 11:47:10&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-05-30 17:36:25&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-06-03 02:44:33&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-06-08 04:19:57&quot;,&quot;http_code&quot;:403},{&quot;date&quot;:&quot;2026-06-12 11:03:57&quot;,&quot;http_code&quot;:403}],&quot;broken&quot;:true,&quot;last_checked&quot;:{&quot;date&quot;:&quot;2026-06-12 11:03:57&quot;,&quot;http_code&quot;:403},&quot;process&quot;:&quot;done&quot;},{&quot;id&quot;:2356,&quot;href&quot;:&quot;https:\\\/\\\/hadoop.apache.org\\\/docs\\\/r1.2.1\\\/mapred_tutorial.html&quot;,&quot;archived_href&quot;:&quot;http:\\\/\\\/web-wp.archive.org\\\/web\\\/20251006081236\\\/https:\\\/\\\/hadoop.apache.org\\\/docs\\\/r1.2.1\\\/mapred_tutorial.html&quot;,&quot;redirect_href&quot;:&quot;&quot;,&quot;checks&quot;:[{&quot;date&quot;:&quot;2025-12-11 04:17:43&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2025-12-14 14:12:45&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2025-12-23 08:39:57&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2025-12-28 10:51:22&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-01-02 17:54:50&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-01-07 03:21:22&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-01-11 14:22:42&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-01-14 18:52:31&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-01-18 15:24:11&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-01-24 
11:45:02&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-01-29 07:41:42&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-02-02 23:30:25&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-02-06 06:42:43&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-02-09 07:37:12&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-02-13 10:20:07&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-02-17 17:30:25&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-02-21 17:33:53&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-02-25 06:21:48&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-03-01 09:12:49&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-03-04 11:32:48&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-03-07 16:50:44&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-03-14 10:57:04&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-03-18 14:32:56&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-03-22 12:28:04&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-03-26 05:04:13&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-03-30 07:41:54&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-04-04 12:01:02&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-04-07 13:34:32&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-04-10 15:34:07&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-04-14 16:37:53&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-04-19 22:20:27&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-04-23 10:37:33&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-04-29 04:43:48&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-05-04 08:33:42&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-05-10 
16:54:37&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-05-16 20:49:49&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-05-21 16:08:34&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-05-29 11:36:51&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-06-01 16:34:56&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-06-08 18:30:12&quot;,&quot;http_code&quot;:206},{&quot;date&quot;:&quot;2026-06-12 11:03:59&quot;,&quot;http_code&quot;:206}],&quot;broken&quot;:false,&quot;last_checked&quot;:{&quot;date&quot;:&quot;2026-06-12 11:03:59&quot;,&quot;http_code&quot;:206},&quot;process&quot;:&quot;done&quot;}]'><\/div>\n<h2>1. Objective<\/h2>\n<p><strong>MapReduce<\/strong> is the core component of <a href=\"http:\/\/data-flair.training\/blogs\/hadoop-tutorial-for-beginners\/\"><strong>Hadoop<\/strong><\/a> that process huge amount of data in parallel by dividing the work into a set of independent tasks. In MapReduce data flow in step by step from Mapper to Reducer. In this tutorial, we are going to cover how Hadoop MapReduce works internally?<\/p>\n<p>This blog on Hadoop\u00a0MapReduce\u00a0data flow will provide you the complete MapReduce data flow chart in Hadoop. The tutorial covers various phases of MapReduce job execution such as\u00a0<strong>Input Files<\/strong>,<strong> InputFormat in Hadoop<\/strong>,<strong> InputSplits<\/strong>,<strong> RecordReader<\/strong>,<strong> Mapper<\/strong>,<strong> Combiner<\/strong>,<strong> Partitioner<\/strong>,<strong> Shuffling and Sorting<\/strong>,<strong> Reducer<\/strong>,<strong> RecordWriter and OutputFormat<\/strong> in detail. 
We will also learn How Hadoop MapReduce works with the help of all these phases.<\/p>\n<div id=\"attachment_42333\" style=\"width: 1210px\" class=\"wp-caption aligncenter\"><a href=\"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1.jpg\"><img loading=\"lazy\" decoding=\"async\" aria-describedby=\"caption-attachment-42333\" class=\"size-full wp-image-42333\" src=\"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1.jpg\" alt=\"How Hadoop MapReduce Works - MapReduce Tutorial\" width=\"1200\" height=\"628\" srcset=\"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1.jpg 1200w, https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1-150x79.jpg 150w, https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1-300x157.jpg 300w, https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1-768x402.jpg 768w, https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1-1024x536.jpg 1024w, https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1-520x272.jpg 520w\" sizes=\"auto, (max-width: 1200px) 100vw, 1200px\" \/><\/a><p id=\"caption-attachment-42333\" class=\"wp-caption-text\">How Hadoop MapReduce Works &#8211; MapReduce Tutorial<\/p><\/div>\n<h2>2. What is MapReduce?<\/h2>\n<p><strong>MapReduce<\/strong> is the data processing layer of Hadoop. 
It is a software framework for easily writing applications that process the vast amount of structured and unstructured data stored in the <strong><a href=\"http:\/\/data-flair.training\/blogs\/comprehensive-hdfs-guide-introduction-architecture-data-read-write-tutorial\/\">Hadoop Distributed Filesystem (HDFS)<\/a><\/strong>. It processes the huge amount of data in parallel by dividing the job (submitted job) into a set of independent tasks (sub-job). This parallel processing improves the speed and reliability of the cluster. We just need to put the custom code (business logic) in the way MapReduce works, and the rest will be taken care of by the engine.<\/p>\n<h2>3. How Hadoop MapReduce Works?<\/h2>\n<p>In Hadoop, MapReduce works by breaking the data processing into two phases: Map phase and Reduce phase. The map is the first phase of processing, where we specify all the complex logic\/business rules\/costly code. Reduce is the second phase of processing, where we specify light-weight processing like aggregation\/summation.<\/p>\n<h2>4. MapReduce Flow Chart<\/h2>\n<p>Now let us see How Hadoop MapReduce works by understanding the end to end Hadoop MapReduce job execution flow with components in detail:<\/p>\n<h3>4.1. Input Files<\/h3>\n<p>The data for a MapReduce task is stored in <strong>input files<\/strong>, and input files typically live in <strong>HDFS<\/strong>. The format of these files is arbitrary; line-based log files and binary formats can both be used.<\/p>\n<h3>4.2. InputFormat<\/h3>\n<p>Now, <strong>InputFormat<\/strong> defines how these input files are split and read. It selects the files or other objects that are used for input. InputFormat creates InputSplit. <a href=\"http:\/\/data-flair.training\/blogs\/hadoop-inputformat-types\/\">Learn MapReduce InputFormat in detail.<\/a><\/p>\n<h3>4.3. 
InputSplits<\/h3>\n<p>InputSplits are created by InputFormat and logically represent the data which will be processed by an individual <strong>Mapper\u00a0<\/strong>(We will understand mapper below). One map task is created for each split; thus the number of map tasks will be equal to the number of InputSplits. The split is divided into records and each record will be processed by the mapper. <a href=\"http:\/\/data-flair.training\/blogs\/inputsplit-in-hadoop-mapreduce\/\">Learn MapReduce InputSplit in detail.<\/a><\/p>\n<h3>4.4. RecordReader<\/h3>\n<p>It communicates with the <strong>InputSplit<\/strong> in Hadoop MapReduce and converts the data into key-value pairs suitable for reading by the mapper. By default, it uses TextInputFormat for converting data into a key-value pair. RecordReader communicates with the InputSplit until the file reading is completed. It assigns a byte offset (unique number) to each line present in the file. Further, these key-value pairs are sent to the mapper for further processing.<\/p>\n<h3>4.5. Mapper<\/h3>\n<p>It processes each input record (from RecordReader) and generates a new key-value pair; the key-value pair generated by the Mapper can be completely different from the input pair. The output of the Mapper is also known as intermediate output, which is written to the local disk. The output of the Mapper is not stored on HDFS as this is temporary data and writing on HDFS will create unnecessary copies (also HDFS is a high latency system). The Mapper&#8217;s output is passed to the combiner for further processing.<\/p>\n<p>Follow this link to learn <a href=\"http:\/\/data-flair.training\/blogs\/hadoop-hdfs-data-read-and-write-operations\/\">Data read and write operation in HDFS.<\/a><\/p>\n<h3>4.6. Combiner<\/h3>\n<p>The combiner is also known as \u2018Mini-reducer\u2019. 
Hadoop MapReduce Combiner performs local aggregation on the mappers&#8217; output, which helps to minimize the data transfer between mapper and <strong>reducer<\/strong>\u00a0(we will see reducer below). Once the combiner functionality is executed, the output is then passed to the partitioner for further work. <a href=\"http:\/\/data-flair.training\/blogs\/combiner-in-hadoop-mapreduce-advantages-disadvantages\/\">Learn MapReduce Combiner in detail.<\/a><\/p>\n<h3>4.7. Partitioner<\/h3>\n<p>In Hadoop MapReduce,\u00a0the <strong>Partitioner<\/strong> comes into the picture if we are working with more than one reducer (with a single reducer, the partitioner is not used).<\/p>\n<p>The Partitioner takes the output from the combiners and performs partitioning. Partitioning of the output takes place on the basis of the key, and the output is then sorted. A hash function of the key (or a subset of the key) is used to derive the partition.<\/p>\n<p>According to the key value in MapReduce, each combiner output is partitioned, and records having the same key value go into the same partition, and then each partition is sent to a reducer. Partitioning allows even distribution of the map output over the reducers. <a href=\"https:\/\/techvidvan.com\/tutorials\/hadoop-partitioner-introduction\/\">Learn MapReduce Partitioner in detail<\/a>.<\/p>\n<h3>4.8. Shuffling and Sorting<\/h3>\n<p>Now, the output is shuffled to the reduce node (a normal slave node that is called the reducer node because the reduce phase runs on it). The shuffling is the physical movement of the data which is done over the network. Once all the mappers are finished and their output is shuffled on the reducer nodes, then this intermediate output is merged and sorted, which is then provided as input to the reduce phase.<\/p>\n<h3>4.9. Reducer<\/h3>\n<p>It takes the set of intermediate key-value pairs produced by the mappers as the input and then runs a reducer function on each of them to generate the output. 
The output of the reducer is the final output, which is stored in HDFS. Follow this link to <a href=\"http:\/\/data-flair.training\/blogs\/reducer-in-hadoop-mapreduce\/\">learn about Reducer in detail.<\/a><\/p>\n<h3>4.10. RecordWriter<\/h3>\n<p>It writes the output key-value pairs from the Reducer phase to the output files.<\/p>\n<h3>4.11. OutputFormat<\/h3>\n<p>The way these output key-value pairs are written in output files by RecordWriter is determined by the OutputFormat. OutputFormat instances provided by Hadoop are used to <a href=\"http:\/\/data-flair.training\/blogs\/hdfs-data-write-operation\/\">write files in HDFS<\/a> or on the local disk. Thus the final output of the reducer is written on HDFS by OutputFormat instances.<\/p>\n<p>Hence, in this manner, Hadoop MapReduce works over the cluster.<\/p>\n<h2>5. Conclusion<\/h2>\n<p>In conclusion, we can say that data flow in MapReduce is the combination of different processing phases such as Input Files, InputFormat in Hadoop, InputSplits, RecordReader, Mapper, Combiner, Partitioner, Shuffling and Sorting, Reducer, RecordWriter, and OutputFormat. Hence all these components play an important role in how Hadoop MapReduce works.<\/p>\n<p>Since you understand the end-to-end MapReduce job flow, test your knowledge by playing the <a href=\"http:\/\/data-flair.training\/blogs\/category\/quiz\/\"><strong>Hadoop Quiz<\/strong>.<\/a><br \/>\nIf you like this blog or have any queries about how Hadoop MapReduce works, leave a comment in the section below. 
We will be glad to solve them.<\/p>\n<p><strong>See Also-<\/strong><\/p>\n<ul>\n<li><a href=\"http:\/\/data-flair.training\/blogs\/mapreduce-job-optimization-performance-tuning-techniques\/\">MapReduce\u00a0job optimization and performance tuning techniques.<\/a><\/li>\n<li><a href=\"http:\/\/data-flair.training\/blogs\/data-locality-hadoop-mapreduce\/\">Hadoop Data Locality\u00a0<\/a><\/li>\n<\/ul>\n<p><a href=\"https:\/\/hadoop.apache.org\/docs\/r1.2.1\/mapred_tutorial.html\">Reference<\/a><\/p>\n","protected":false},"excerpt":{"rendered":"<p>1. Objective MapReduce is the core component of Hadoop that process huge amount of data in parallel by dividing the work into a set of independent tasks. In MapReduce data flow in step by&#46;&#46;&#46;<\/p>\n","protected":false},"author":6,"featured_media":42333,"comment_status":"open","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[37],"tags":[3312,5237,5286,8539,8540,8543,12732],"class_list":["post-2559","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-mapreduce","tag-data-flow-in-hadoop-mapreduce","tag-hadoop-data-flow","tag-hadoop-mapreduce-gdata-flow","tag-mapreduce-data-flow","tag-mapreduce-data-flow-internals","tag-mapreduce-flow-chart","tag-sequence-of-mapreduce-flow"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v27.4 - https:\/\/yoast.com\/product\/yoast-seo-wordpress\/ -->\n<title>How Hadoop MapReduce Works - MapReduce Tutorial - DataFlair<\/title>\n<meta name=\"description\" content=\"Hadoop MapReduce data flow cover how Hadoop MapReduce works,How Mapreduce process data,MapReduce job execution phases-Mapper,Reducer,combiner,partitioner...\" \/>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/\" \/>\n<meta 
property=\"og:locale\" content=\"en_US\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"How Hadoop MapReduce Works - MapReduce Tutorial - DataFlair\" \/>\n<meta property=\"og:description\" content=\"Hadoop MapReduce data flow cover how Hadoop MapReduce works,How Mapreduce process data,MapReduce job execution phases-Mapper,Reducer,combiner,partitioner...\" \/>\n<meta property=\"og:url\" content=\"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/\" \/>\n<meta property=\"og:site_name\" content=\"DataFlair\" \/>\n<meta property=\"article:publisher\" content=\"https:\/\/www.facebook.com\/DataFlairWS\/\" \/>\n<meta property=\"article:published_time\" content=\"2017-05-08T13:12:42+00:00\" \/>\n<meta property=\"article:modified_time\" content=\"2019-05-10T11:30:29+00:00\" \/>\n<meta property=\"og:image\" content=\"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1.jpg\" \/>\n\t<meta property=\"og:image:width\" content=\"1200\" \/>\n\t<meta property=\"og:image:height\" content=\"628\" \/>\n\t<meta property=\"og:image:type\" content=\"image\/jpeg\" \/>\n<meta name=\"author\" content=\"DataFlair Team\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:creator\" content=\"@DataFlairWS\" \/>\n<meta name=\"twitter:site\" content=\"@DataFlairWS\" \/>\n<meta name=\"twitter:label1\" content=\"Written by\" \/>\n\t<meta name=\"twitter:data1\" content=\"DataFlair Team\" \/>\n\t<meta name=\"twitter:label2\" content=\"Est. reading time\" \/>\n\t<meta name=\"twitter:data2\" content=\"5 minutes\" \/>\n<!-- \/ Yoast SEO plugin. 
-->","yoast_head_json":{"title":"How Hadoop MapReduce Works - MapReduce Tutorial - DataFlair","description":"Hadoop MapReduce data flow cover how Hadoop MapReduce works,How Mapreduce process data,MapReduce job execution phases-Mapper,Reducer,combiner,partitioner...","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/","og_locale":"en_US","og_type":"article","og_title":"How Hadoop MapReduce Works - MapReduce Tutorial - DataFlair","og_description":"Hadoop MapReduce data flow cover how Hadoop MapReduce works,How Mapreduce process data,MapReduce job execution phases-Mapper,Reducer,combiner,partitioner...","og_url":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/","og_site_name":"DataFlair","article_publisher":"https:\/\/www.facebook.com\/DataFlairWS\/","article_published_time":"2017-05-08T13:12:42+00:00","article_modified_time":"2019-05-10T11:30:29+00:00","og_image":[{"width":1200,"height":628,"url":"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1.jpg","type":"image\/jpeg"}],"author":"DataFlair Team","twitter_card":"summary_large_image","twitter_creator":"@DataFlairWS","twitter_site":"@DataFlairWS","twitter_misc":{"Written by":"DataFlair Team","Est. 
reading time":"5 minutes"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"Article","@id":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/#article","isPartOf":{"@id":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/"},"author":{"name":"DataFlair Team","@id":"https:\/\/data-flair.training\/blogs\/#\/schema\/person\/2c58ecb4f73a39f0ef993f1ddfcd7b89"},"headline":"How Hadoop MapReduce Works &#8211; MapReduce Tutorial","datePublished":"2017-05-08T13:12:42+00:00","dateModified":"2019-05-10T11:30:29+00:00","mainEntityOfPage":{"@id":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/"},"wordCount":1100,"commentCount":5,"publisher":{"@id":"https:\/\/data-flair.training\/blogs\/#organization"},"image":{"@id":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/#primaryimage"},"thumbnailUrl":"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1.jpg","keywords":["Data flow in hadoop Mapreduce","Hadoop data flow","hadoop Mapreduce gdata flow","MapReduce Data Flow","MapReduce data flow internals","Mapreduce flow chart","sequence of mapReduce flow"],"articleSection":["MapReduce Tutorials"],"inLanguage":"en-US","potentialAction":[{"@type":"CommentAction","name":"Comment","target":["https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/#respond"]}]},{"@type":"WebPage","@id":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/","url":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/","name":"How Hadoop MapReduce Works - MapReduce Tutorial - 
DataFlair","isPartOf":{"@id":"https:\/\/data-flair.training\/blogs\/#website"},"primaryImageOfPage":{"@id":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/#primaryimage"},"image":{"@id":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/#primaryimage"},"thumbnailUrl":"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1.jpg","datePublished":"2017-05-08T13:12:42+00:00","dateModified":"2019-05-10T11:30:29+00:00","description":"Hadoop MapReduce data flow cover how Hadoop MapReduce works,How Mapreduce process data,MapReduce job execution phases-Mapper,Reducer,combiner,partitioner...","breadcrumb":{"@id":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/#breadcrumb"},"inLanguage":"en-US","potentialAction":[{"@type":"ReadAction","target":["https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/"]}]},{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/#primaryimage","url":"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1.jpg","contentUrl":"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2017\/05\/mapreduce-job-execution-flow-1-1024x492-1.jpg","width":1200,"height":628,"caption":"How Hadoop MapReduce Works - MapReduce Tutorial"},{"@type":"BreadcrumbList","@id":"https:\/\/data-flair.training\/blogs\/how-hadoop-mapreduce-works\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"Blog Home","item":"https:\/\/data-flair.training\/blogs\/"},{"@type":"ListItem","position":2,"name":"MapReduce Tutorials","item":"https:\/\/data-flair.training\/blogs\/category\/mapreduce\/"},{"@type":"ListItem","position":3,"name":"How Hadoop MapReduce Works &#8211; MapReduce 
Tutorial"}]},{"@type":"WebSite","@id":"https:\/\/data-flair.training\/blogs\/#website","url":"https:\/\/data-flair.training\/blogs\/","name":"DataFlair","description":"Learn Today. Lead Tomorrow.","publisher":{"@id":"https:\/\/data-flair.training\/blogs\/#organization"},"potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/data-flair.training\/blogs\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"en-US"},{"@type":"Organization","@id":"https:\/\/data-flair.training\/blogs\/#organization","name":"DataFlair","url":"https:\/\/data-flair.training\/blogs\/","logo":{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/data-flair.training\/blogs\/#\/schema\/logo\/image\/","url":"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2016\/07\/Data-Flair.png","contentUrl":"https:\/\/data-flair.training\/blogs\/wp-content\/uploads\/sites\/2\/2016\/07\/Data-Flair.png","width":106,"height":48,"caption":"DataFlair"},"image":{"@id":"https:\/\/data-flair.training\/blogs\/#\/schema\/logo\/image\/"},"sameAs":["https:\/\/www.facebook.com\/DataFlairWS\/","https:\/\/x.com\/DataFlairWS","https:\/\/www.linkedin.com\/company\/dataflair-web-services-pvt-ltd\/","https:\/\/www.youtube.com\/user\/DataFlairWS"]},{"@type":"Person","@id":"https:\/\/data-flair.training\/blogs\/#\/schema\/person\/2c58ecb4f73a39f0ef993f1ddfcd7b89","name":"DataFlair Team","image":{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/secure.gravatar.com\/avatar\/1ce4a0e3e542444fc73bbebf83e89e8b73e2d95ccb1fcee64da9945f078b97c5?s=96&d=mm&r=g","url":"https:\/\/secure.gravatar.com\/avatar\/1ce4a0e3e542444fc73bbebf83e89e8b73e2d95ccb1fcee64da9945f078b97c5?s=96&d=mm&r=g","contentUrl":"https:\/\/secure.gravatar.com\/avatar\/1ce4a0e3e542444fc73bbebf83e89e8b73e2d95ccb1fcee64da9945f078b97c5?s=96&d=mm&r=g","caption":"DataFlair Team"},"description":"The 
DataFlair Team provides industry-driven content on programming, Java, Python, C++, DSA, AI, ML, data Science, Android, Flutter, MERN, Web Development, and technology. Our expert educators focus on delivering value-packed, easy-to-follow resources for tech enthusiasts and professionals.","url":"https:\/\/data-flair.training\/blogs\/author\/dfteam2\/"}]}},"amp_enabled":true,"_links":{"self":[{"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/posts\/2559","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/users\/6"}],"replies":[{"embeddable":true,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/comments?post=2559"}],"version-history":[{"count":5,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/posts\/2559\/revisions"}],"predecessor-version":[{"id":56086,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/posts\/2559\/revisions\/56086"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/media\/42333"}],"wp:attachment":[{"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/media?parent=2559"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/categories?post=2559"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/data-flair.training\/blogs\/wp-json\/wp\/v2\/tags?post=2559"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}