Building a Concurrent Log File Analysis Framework

Welcome back! In our previous lesson, we ventured into parallel algorithms and their applications. We now shift our focus to another practical challenge: building a Concurrent Log File Analysis Framework. This task requires you to integrate several of Java's concurrency utilities to process large log datasets effectively. The skills you acquired in earlier lessons, such as parallel merge sort and LRU caches, will now help you manage concurrency in a real-world application: log file analysis.

What You'll Learn

In this lesson, we focus on enhancing your ability to:

  • Develop a concurrent framework using advanced asynchronous programming.
  • Synchronize multiple tasks and phases effectively.
  • Handle complex data dependencies with ease.

Through this lesson, you will learn how to use concurrency techniques to analyze and process large datasets efficiently, a crucial skill in today's data-driven world.

Understanding the Concurrent Log File Analysis Framework

Log file analysis is a common challenge in software development, especially for systems generating large volumes of log data. The goal is to create a framework that can concurrently process these logs to extract meaningful information, such as counting occurrences of specific log levels (ERROR, WARN, INFO). To achieve this, you'll employ a map-reduce approach:

  • Map Phase: Parse each file independently and extract the relevant data (log level counts).
  • Reduce Phase: Combine the results from all files into a consolidated view of the data.

This approach not only improves performance by leveraging multiple CPU cores but also ensures scalability.

Map Phase

Let's start by handling the Map Phase, where each log file is independently processed to extract log level frequencies.
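
Here is a minimal sketch of such a mapPhase method, assuming each file fits in memory and log levels appear as whitespace-delimited tokens:

```java
import java.io.IOException;
import java.io.UncheckedIOException;
import java.nio.file.Files;
import java.nio.file.Paths;
import java.util.Arrays;
import java.util.Map;
import java.util.Set;
import java.util.stream.Collectors;

private static Map<String, Long> mapPhase(String filePath) {
    // The log levels we want to count
    Set<String> levels = Set.of("ERROR", "WARN", "INFO");
    try {
        // Read the whole file, split it into whitespace-delimited tokens,
        // and count how often each log level appears
        String content = Files.readString(Paths.get(filePath));
        return Arrays.stream(content.split("\\s+"))
                .filter(levels::contains)
                .collect(Collectors.groupingBy(token -> token, Collectors.counting()));
    } catch (IOException e) {
        throw new UncheckedIOException(e);
    }
}
```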

The mapPhase method extracts log level information from a single file. It reads the file content, splits it into tokens, and counts occurrences of ERROR, WARN, and INFO. Java's stream API keeps this processing concise and expressive. The method returns a map of log levels to their counts for that file.

Reduce Phase

After independently analyzing each file, the next step consolidates the results from all files, known as the Reduce Phase.
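
A minimal sketch of reducePhase, assuming finalResult is the shared ConcurrentHashMap introduced later in the lesson:

```java
import java.util.Map;
import java.util.concurrent.ConcurrentHashMap;

private static void reducePhase(Map<String, Long> fileCounts,
                                ConcurrentHashMap<String, Long> finalResult) {
    // merge() adds this file's count to the running total atomically,
    // so the update stays safe even when several threads reduce at once
    fileCounts.forEach((level, count) -> finalResult.merge(level, count, Long::sum));
}
```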

The reducePhase method merges the counts from individual files into a comprehensive result. It updates the finalResult map by adding the counts from each file's analysis. ConcurrentHashMap's merge method aggregates each log level atomically, avoiding race conditions and keeping the operation thread-safe even under concurrent updates.

Starting the Log Analysis

The startLogAnalysis method handles the overall process of mapping and reducing in a concurrent environment. We'll split it into two parts for clarity.

Map Phase in startLogAnalysis

In the map phase, each file is processed concurrently to extract log level data.
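
A sketch of the first half of startLogAnalysis, assuming the mapPhase method above and a pool sized to the available CPU cores:

```java
// Inside startLogAnalysis(List<String> logFiles):
ExecutorService executor =
        Executors.newFixedThreadPool(Runtime.getRuntime().availableProcessors());

// Launch one asynchronous map task per log file on the shared pool
List<CompletableFuture<Map<String, Long>>> mapFutures = logFiles.stream()
        .map(file -> CompletableFuture.supplyAsync(() -> mapPhase(file), executor))
        .collect(Collectors.toList());
```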

In this part of the startLogAnalysis method, we create a fixed thread pool using ExecutorService to manage the concurrent processing. Each log file is analyzed in parallel via CompletableFuture.supplyAsync(), which executes each task without blocking the caller. The list mapFutures holds the pending result of each asynchronous task (i.e., the log level counts for one file). This phase leverages multithreading to work through large datasets efficiently.

Reduce Phase in startLogAnalysis

After the map phase is complete, we proceed to the reduce phase.
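
Continuing the sketch, the second half of startLogAnalysis might look like this, with finalResult collecting the aggregated counts:

```java
// Still inside startLogAnalysis, continuing from the map phase above
ConcurrentHashMap<String, Long> finalResult = new ConcurrentHashMap<>();

// allOf() completes only once every map task has finished
CompletableFuture<Void> analysis = CompletableFuture
        .allOf(mapFutures.toArray(new CompletableFuture[0]))
        .thenRunAsync(() -> {
            // join() cannot block here: allOf() guarantees each future is done
            mapFutures.forEach(future -> reducePhase(future.join(), finalResult));
            System.out.println("Final log level counts: " + finalResult);
        }, executor);

analysis.join();     // wait for the pipeline so the pool can shut down cleanly
executor.shutdown();
```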

The reduce phase begins by combining all the CompletableFuture objects with CompletableFuture.allOf(), which completes only after every map task has finished. Once they have, thenRunAsync() launches the reduce step in a non-blocking manner, aggregating the per-file counts into a ConcurrentHashMap. This map stores the total count of each log level across all log files.

Running the Application

The main() method orchestrates the execution of the log analysis by calling startLogAnalysis().
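
A minimal sketch of main, with hypothetical file paths standing in for real logs:

```java
public static void main(String[] args) {
    // Hypothetical log file paths; substitute your own
    List<String> logFiles = List.of("app1.log", "app2.log", "app3.log");
    try {
        startLogAnalysis(logFiles);
    } catch (Exception e) {
        System.err.println("Log analysis failed: " + e.getMessage());
    }
}
```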

The main() method simply initializes the log file paths and starts the analysis by invoking startLogAnalysis(). It also catches any exceptions thrown during execution, reporting failures instead of letting the program crash.

Why It Matters

Developing a Concurrent Log File Analysis Framework is crucial as it reflects real-world applications where high-volume data processing is essential. By effectively using concurrency:

  • Efficiency is improved, allowing for faster processing of large datasets.
  • Scalability is ensured, making it feasible to handle increasing log volumes.
  • Readability is maintained, since the map and reduce phases are expressed as structured, composable steps rather than manual thread management.

Now that we've covered the fundamental concepts and shown you how to implement a concurrent log analysis framework, you're ready to apply these concepts to real-world problems. Let's proceed to the practice section to solidify your understanding and skills!
