diff --git a/hadoop-common-project/hadoop-common/CHANGES.txt b/hadoop-common-project/hadoop-common/CHANGES.txt index 995965c730f..b90573e7607 100644 --- a/hadoop-common-project/hadoop-common/CHANGES.txt +++ b/hadoop-common-project/hadoop-common/CHANGES.txt @@ -22,18 +22,18 @@ Trunk (Unreleased) (Dexter Bradshaw, Mostafa Elhemali, Xi Fang, Johannes Klein, David Lao, Mike Liddell, Chuan Liu, Lengning Liu, Ivan Mitic, Michael Rys, Alexander Stojanovich, Brian Swan, and Min Wei via cnauroth) - + IMPROVEMENTS HADOOP-8017. Configure hadoop-main pom to get rid of M2E plugin execution not covered (Eric Charles via bobby) - HADOOP-8015. ChRootFileSystem should extend FilterFileSystem + HADOOP-8015. ChRootFileSystem should extend FilterFileSystem (Daryn Sharp via bobby) HADOOP-7595. Upgrade dependency to Avro 1.5.3. (Alejandro Abdelnur via atm) - HADOOP-8078. Add capability to turn on security in unit tests. (Jaimin + HADOOP-8078. Add capability to turn on security in unit tests. (Jaimin Jetly via jitendra) HADOOP-7757. Test file reference count is at least 3x actual value (Jon @@ -89,7 +89,7 @@ Trunk (Unreleased) HADOOP-8776. Provide an option in test-patch that can enable/disable compiling native code. (Chris Nauroth via suresh) - HADOOP-6616. Improve documentation for rack awareness. (Adam Faris via + HADOOP-6616. Improve documentation for rack awareness. (Adam Faris via jghoman) HADOOP-9075. FileContext#FSLinkResolver should be made static. @@ -105,7 +105,7 @@ Trunk (Unreleased) HADOOP-8844. Add a plaintext fs -text test-case. (Akira AJISAKA via harsh) - HADOOP-9432 Add support for markdown .md files in site documentation + HADOOP-9432 Add support for markdown .md files in site documentation (stevel) HADOOP-9186. test-patch.sh should report build failure to JIRA. @@ -138,14 +138,14 @@ Trunk (Unreleased) HADOOP-11025. hadoop-daemons.sh should just call hdfs directly (Masatake Iwasaki via aw) - HADOOP-11150. 
hadoop command should show the reason on failure by + HADOOP-11150. hadoop command should show the reason on failure by invalid COMMAND or CLASSNAME (Masatake Iwasaki via aw) HADOOP-11208. Replace "daemon" with better name in script subcommands (aw) HADOOP-10926. Improve smart-apply-patch.sh to apply binary diffs (cmccabe) - HADOOP-11081. Document hadoop properties expected to be set by the shell + HADOOP-11081. Document hadoop properties expected to be set by the shell code in *-env.sh (aw) BUG FIXES @@ -155,7 +155,7 @@ Trunk (Unreleased) HADOOP-8419. Fixed GzipCode NPE reset for IBM JDK. (Yu Li via eyang) - HADOOP-8177. MBeans shouldn't try to register when it fails to create + HADOOP-8177. MBeans shouldn't try to register when it fails to create MBeanName. (Devaraj K via umamahesh) HADOOP-8018. Hudson auto test for HDFS has started throwing javadoc @@ -168,11 +168,11 @@ Trunk (Unreleased) HADOOP-7621. alfredo config should be in a file not readable by users (Alejandro Abdelnur via atm) - - HADOOP-7669 Fix newly introduced release audit warning. + + HADOOP-7669 Fix newly introduced release audit warning. (Uma Maheswara Rao G via stevel) - - HADOOP-6220. HttpServer wraps InterruptedExceptions by IOExceptions + + HADOOP-6220. HttpServer wraps InterruptedExceptions by IOExceptions if interrupted in startup (stevel) HADOOP-7703. Improved exception handling of shutting down web server. @@ -183,7 +183,7 @@ Trunk (Unreleased) HADOOP-7769. TestJMXJsonServlet is failing. (tomwhite) - HADOOP-7770. ViewFS getFileChecksum throws FileNotFoundException for files in + HADOOP-7770. ViewFS getFileChecksum throws FileNotFoundException for files in /tmp and /user. (Ravi Prakash via jitendra) HADOOP-8141. Add method to SecurityUtil to init krb5 cipher suites. @@ -194,7 +194,7 @@ Trunk (Unreleased) HADOOP-8312. testpatch.sh should provide a simpler way to see which warnings changed (bobby) - HADOOP-8339. jenkins complaining about 16 javadoc warnings + HADOOP-8339. 
jenkins complaining about 16 javadoc warnings (Tom White and Robert Evans via tgraves) HADOOP-8354. test-patch findbugs may fail if a dependent module is changed @@ -243,7 +243,7 @@ Trunk (Unreleased) HADOOP-8818. Use equals instead == in MD5MD5CRC32FileChecksum and TFileDumper. (Brandon Li via suresh) - HADOOP-8821. Fix findbugs warning related to concatenating string in a + HADOOP-8821. Fix findbugs warning related to concatenating string in a for loop in Configuration#dumpDeprecatedKeys(). (suresh) HADOOP-7256. Resource leak during failure scenario of closing @@ -274,7 +274,7 @@ Trunk (Unreleased) HADOOP-9037. Bug in test-patch.sh and precommit build process (Kihwal Lee via jlowe) - HADOOP-9121. InodeTree.java has redundant check for vName while + HADOOP-9121. InodeTree.java has redundant check for vName while throwing exception. (Arup Malakar via suresh) HADOOP-9131. Turn off TestLocalFileSystem#testListStatusWithColons on @@ -339,12 +339,12 @@ Trunk (Unreleased) HADOOP-11033. shell scripts ignore JAVA_HOME on OS X. (aw) - HADOOP-11052. hadoop_verify_secure_prereq's results aren't checked + HADOOP-11052. hadoop_verify_secure_prereq's results aren't checked in bin/hdfs (aw) HADOOP-11055. non-daemon pid files are missing (aw) - HADOOP-11022. User replaced functions get lost 2-3 levels deep (e.g., + HADOOP-11022. User replaced functions get lost 2-3 levels deep (e.g., sbin) (aw) HADOOP-11248. Add hadoop configuration to disable Azure Filesystem metrics @@ -404,9 +404,6 @@ Release 2.7.0 - UNRELEASED HADOOP-11341. KMS support for whitelist key ACLs. (Arun Suresh via wang) - HADOOP-11301. [optionally] update jmx cache to drop old metrics - (Maysam Yabandeh via stack) - OPTIMIZATIONS HADOOP-11323. WritableComparator#compare keeps reference to byte array. @@ -531,7 +528,7 @@ Release 2.6.0 - 2014-11-18 HADOOP-10610. Upgrade S3n s3.fs.buffer.dir to support multi directories. (Ted Malaska via atm) - HADOOP-10817. 
ProxyUsers configuration should support configurable + HADOOP-10817. ProxyUsers configuration should support configurable prefixes. (tucu) HADOOP-10755. Support negative caching of user-group mapping. @@ -555,13 +552,13 @@ Release 2.6.0 - 2014-11-18 HADOOP-10903. Enhance hadoop classpath command to expand wildcards or write classpath into jar manifest. (cnauroth) - HADOOP-10791. AuthenticationFilter should support externalizing the + HADOOP-10791. AuthenticationFilter should support externalizing the secret for signing and provide rotation support. (rkanter via tucu) - HADOOP-10771. Refactor HTTP delegation support out of httpfs to common. + HADOOP-10771. Refactor HTTP delegation support out of httpfs to common. (tucu) - HADOOP-10835. Implement HTTP proxyuser support in HTTP authentication + HADOOP-10835. Implement HTTP proxyuser support in HTTP authentication client/server libraries. (tucu) HADOOP-10820. Throw an exception in GenericOptionsParser when passed @@ -570,10 +567,10 @@ Release 2.6.0 - 2014-11-18 HADOOP-10281. Create a scheduler, which assigns schedulables a priority level. (Chris Li via Arpit Agarwal) - HADOOP-8944. Shell command fs -count should include human readable option + HADOOP-8944. Shell command fs -count should include human readable option (Jonathan Allen via aw) - HADOOP-10231. Add some components in Native Libraries document (Akira + HADOOP-10231. Add some components in Native Libraries document (Akira AJISAKA via aw) HADOOP-10650. Add ability to specify a reverse ACL (black list) of users @@ -622,12 +619,12 @@ Release 2.6.0 - 2014-11-18 HADOOP-10698. KMS, add proxyuser support. (tucu) - HADOOP-8896. Javadoc points to Wrong Reader and Writer classes + HADOOP-8896. Javadoc points to Wrong Reader and Writer classes in SequenceFile (Ray Chiang via aw) HADOOP-10998. Fix bash tab completion code to work (Jim Hester via aw) - HADOOP-10880. Move HTTP delegation tokens out of URL querystring to + HADOOP-10880. 
Move HTTP delegation tokens out of URL querystring to a header. (tucu) HADOOP-11005. Fix HTTP content type for ReconfigurationServlet. @@ -636,26 +633,26 @@ Release 2.6.0 - 2014-11-18 HADOOP-10814. Update Tomcat version used by HttpFS and KMS to latest 6.x version. (rkanter via tucu) - HADOOP-10994. KeyProviderCryptoExtension should use CryptoCodec for + HADOOP-10994. KeyProviderCryptoExtension should use CryptoCodec for generation/decryption of keys. (tucu) HADOOP-11021. Configurable replication factor in the hadoop archive command. (Zhe Zhang via wang) - HADOOP-11030. Define a variable jackson.version instead of using constant + HADOOP-11030. Define a variable jackson.version instead of using constant at multiple places. (Juan Yu via kasha) HADOOP-10990. Add missed NFSv3 request and response classes (brandonli) - HADOOP-10863. KMS should have a blacklist for decrypting EEKs. + HADOOP-10863. KMS should have a blacklist for decrypting EEKs. (asuresh via tucu) HADOOP-11054. Add a KeyProvider instantiation based on a URI. (tucu) - HADOOP-11015. Http server/client utils to propagate and recreate + HADOOP-11015. Http server/client utils to propagate and recreate Exceptions from server to client. (tucu) - HADOOP-11060. Create a CryptoCodec test that verifies interoperability + HADOOP-11060. Create a CryptoCodec test that verifies interoperability between the JCE and OpenSSL implementations. (hitliuyi via tucu) HADOOP-11070. Create MiniKMS for testing. (tucu) @@ -676,7 +673,7 @@ Release 2.6.0 - 2014-11-18 HADOOP-11091. Eliminate old configuration parameter names from s3a (David S. Wang via Colin Patrick McCabe) - HADOOP-10868. AuthenticationFilter should support externalizing the + HADOOP-10868. AuthenticationFilter should support externalizing the secret for signing and provide rotation support. (rkanter via tucu) HADOOP-10922. User documentation for CredentialShell. (Larry McCay via wang) @@ -688,7 +685,7 @@ Release 2.6.0 - 2014-11-18 HADOOP-10970. 
Cleanup KMS configuration keys. (wang) - HADOOP-11017. KMS delegation token secret manager should be able to use + HADOOP-11017. KMS delegation token secret manager should be able to use zookeeper as store. (asuresh via tucu) HADOOP-11009. Add Timestamp Preservation to DistCp (Gary Steelman via aw) @@ -699,10 +696,10 @@ Release 2.6.0 - 2014-11-18 HADOOP-8808. Update FsShell documentation to mention deprecation of some of the commands, and mention alternatives (Akira AJISAKA via aw) - HADOOP-10954. Adding site documents of hadoop-tools (Masatake Iwasaki + HADOOP-10954. Adding site documents of hadoop-tools (Masatake Iwasaki via aw) - HADOOP-10731. Remove @date JavaDoc comment in ProgramDriver class (Henry + HADOOP-10731. Remove @date JavaDoc comment in ProgramDriver class (Henry Saputra via aw) HADOOP-11153. Make number of KMS threads configurable. (wang) @@ -837,7 +834,7 @@ Release 2.6.0 - 2014-11-18 HADOOP-10927. Fix CredentialShell help behavior and error codes. (Josh Elser via wang) - HADOOP-10933. FileBasedKeyStoresFactory Should use Configuration.getPassword + HADOOP-10933. FileBasedKeyStoresFactory Should use Configuration.getPassword for SSL Passwords. (lmccay via tucu) HADOOP-10759. Remove hardcoded JAVA_HEAP_MAX. (Sam Liu via Eric Yang) @@ -881,7 +878,7 @@ Release 2.6.0 - 2014-11-18 HADOOP-10972. Native Libraries Guide contains mis-spelt build line (Peter Klavins via aw) - HADOOP-10873. Fix dead link in Configuration javadoc (Akira AJISAKA + HADOOP-10873. Fix dead link in Configuration javadoc (Akira AJISAKA via aw) HADOOP-10968. hadoop native build fails to detect java_libarch on @@ -987,54 +984,54 @@ Release 2.6.0 - 2014-11-18 Windows. (Varun Vasudev via wheat9) BREAKDOWN OF HDFS-6134 AND HADOOP-10150 SUBTASKS AND RELATED JIRAS - + HADOOP-10734. Implement high-performance secure random number sources. (Yi Liu via Colin Patrick McCabe) - + HADOOP-10603. Crypto input and output streams implementing Hadoop stream interfaces. 
(Yi Liu and Charles Lamb) - + HADOOP-10628. Javadoc and few code style improvement for Crypto input and output streams. (Yi Liu via clamb) - - HADOOP-10632. Minor improvements to Crypto input and output streams. + + HADOOP-10632. Minor improvements to Crypto input and output streams. (Yi Liu) - + HADOOP-10635. Add a method to CryptoCodec to generate SRNs for IV. (Yi Liu) - - HADOOP-10653. Add a new constructor for CryptoInputStream that + + HADOOP-10653. Add a new constructor for CryptoInputStream that receives current position of wrapped stream. (Yi Liu) - + HADOOP-10662. NullPointerException in CryptoInputStream while wrapped stream is not ByteBufferReadable. Add tests using normal stream. (Yi Liu) - - HADOOP-10713. Refactor CryptoCodec#generateSecureRandom to take a byte[]. + + HADOOP-10713. Refactor CryptoCodec#generateSecureRandom to take a byte[]. (wang via yliu) - - HADOOP-10693. Implementation of AES-CTR CryptoCodec using JNI to OpenSSL. + + HADOOP-10693. Implementation of AES-CTR CryptoCodec using JNI to OpenSSL. (Yi Liu via cmccabe) - + HADOOP-10803. Update OpensslCipher#getInstance to accept CipherSuite#name format. (Yi Liu) - + HADOOP-10735. Fall back AesCtrCryptoCodec implementation from OpenSSL to JCE if non native support. (Yi Liu) - + HADOOP-10870. Failed to load OpenSSL cipher error logs on systems with old openssl versions (cmccabe) - + HADOOP-10853. Refactor get instance of CryptoCodec and support create via algorithm/mode/padding. (Yi Liu) - + HADOOP-10919. Copy command should preserve raw.* namespace extended attributes. (clamb) - + HDFS-6873. Constants in CommandWithDestination should be static. (clamb) - + HADOOP-10871. incorrect prototype in OpensslSecureRandom.c (cmccabe) - - HADOOP-10886. CryptoCodec#getCodecclasses throws NPE when configurations not - loaded. (umamahesh) + + HADOOP-10886. CryptoCodec#getCodecclasses throws NPE when configurations not + loaded. (umamahesh) -- HADOOP-10911. 
hadoop.auth cookie after HADOOP-10710 still not proper @@ -1065,13 +1062,13 @@ Release 2.6.0 - 2014-11-18 HADOOP-11077. NPE if hosts not specified in ProxyUsers. (gchanan via tucu) - HADOOP-9989. Bug introduced in HADOOP-9374, which parses the -tokenCacheFile + HADOOP-9989. Bug introduced in HADOOP-9374, which parses the -tokenCacheFile as binary file but set it to the configuration as JSON file. (zxu via tucu) HADOOP-11085. Excessive logging by org.apache.hadoop.util.Progress when value is NaN (Mit Desai via jlowe) - HADOOP-11083. After refactoring of HTTP proxyuser to common, doAs param is + HADOOP-11083. After refactoring of HTTP proxyuser to common, doAs param is case sensitive. (tucu) HADOOP-11088. Unittest TestKeyShell, TestCredShell and TestKMS assume UNIX @@ -1083,7 +1080,7 @@ Release 2.6.0 - 2014-11-18 HADOOP-11097. kms docs say proxyusers, not proxyuser for config params. (clamb via tucu) - HADOOP-11062. CryptoCodec testcases requiring OpenSSL should be run + HADOOP-11062. CryptoCodec testcases requiring OpenSSL should be run only if -Pnative is used. (asuresh via tucu) HADOOP-11099. KMS return HTTP UNAUTHORIZED 401 on ACL failure. (tucu) @@ -1107,7 +1104,7 @@ Release 2.6.0 - 2014-11-18 HADOOP-11048. user/custom LogManager fails to load if the client classloader is enabled (Sangjin Lee via jlowe) - HADOOP-10552. Fix usage and example at FileSystemShell.apt.vm (Kenji + HADOOP-10552. Fix usage and example at FileSystemShell.apt.vm (Kenji Kikushima via aw) HADOOP-11143 NetUtils.wrapException loses inner stack trace on BindException @@ -1139,7 +1136,7 @@ Release 2.6.0 - 2014-11-18 HADOOP-11228. Winutils task: unsecure path should not call AddNodeManagerAndUserACEsToObject. (Remus Rusanu via jianhe) - HADOOP-11170. ZKDelegationTokenSecretManager fails to renewToken created by + HADOOP-11170. ZKDelegationTokenSecretManager fails to renewToken created by a peer. (Arun Suresh and Gregory Chanan via kasha) HADOOP-11217. Disable SSLv3 in KMS. 
(Robert Kanter via kasha) @@ -1176,7 +1173,7 @@ Release 2.5.2 - 2014-11-19 NEW FEATURES IMPROVEMENTS - + OPTIMIZATIONS BUG FIXES @@ -1194,7 +1191,7 @@ Release 2.5.1 - 2014-09-05 NEW FEATURES IMPROVEMENTS - + HADOOP-10956. Fix create-release script to include docs and necessary txt files. (kasha) @@ -1248,7 +1245,7 @@ Release 2.5.0 - 2014-08-11 HADOOP-10471. Reduce the visibility of constants in ProxyUsers. (Benoy Antony via wheat9) - HADOOP-10556. Add toLowerCase support to auth_to_local rules + HADOOP-10556. Add toLowerCase support to auth_to_local rules for service name. (tucu) HADOOP-10467. Enable proxyuser specification to support list of users in @@ -1271,7 +1268,7 @@ Release 2.5.0 - 2014-08-11 HADOOP-10618. Remove SingleNodeSetup.apt.vm. (Akira Ajisaka via Arpit Agarwal) - HADOOP-9968. Makes ProxyUsers to work with NetGroups (Benoy Antony via + HADOOP-9968. Makes ProxyUsers to work with NetGroups (Benoy Antony via ddas) HADOOP-10448. Support pluggable mechanism to specify proxy user settings. @@ -1328,7 +1325,7 @@ Release 2.5.0 - 2014-08-11 HADOOP-9651 Filesystems to throw FileAlreadyExistsException in createFile(path, overwrite=false) when the file exists (stevel) - + HADOOP-9495 Define behaviour of Seekable.seek(), write tests, fix all hadoop implementations for compliance @@ -1336,7 +1333,7 @@ Release 2.5.0 - 2014-08-11 HADOOP-10782. Fix typo in DataChecksum class. (Jingguo Yao via suresh) - HADOOP-10896. Update compatibility doc to capture visibility of + HADOOP-10896. Update compatibility doc to capture visibility of un-annotated classes/ methods. (kasha) OPTIMIZATIONS @@ -1344,7 +1341,7 @@ Release 2.5.0 - 2014-08-11 HADOOP-10674. Improve PureJavaCrc32 performance and use java.util.zip.CRC32 for Java 7 and above. (szetszwo) - BUG FIXES + BUG FIXES HADOOP-10378. Typo in help printed by hdfs dfs -help. (Mit Desai via suresh) @@ -1362,7 +1359,7 @@ Release 2.5.0 - 2014-08-11 HADOOP-10459. distcp V2 doesn't preserve root dir's attributes when -p is specified. 
(Yongjun Zhang via atm) - HADOOP-10462. DF#getFilesystem is not parsing the command output. + HADOOP-10462. DF#getFilesystem is not parsing the command output. (Akira AJISAKA via umamahesh) HADOOP-10468. TestMetricsSystemImpl.testMultiThreadedPublish fails @@ -1388,7 +1385,7 @@ Release 2.5.0 - 2014-08-11 HADOOP-9919. Update hadoop-metrics2.properties examples to Yarn. (Akira AJISAKA via suresh) - HADOOP-10526. Chance for Stream leakage in CompressorStream. (Rushabh + HADOOP-10526. Chance for Stream leakage in CompressorStream. (Rushabh Shah via kihwal) HADOOP-10251. Both NameNodes could be in STANDBY State if SNN network is unstable @@ -1421,7 +1418,7 @@ Release 2.5.0 - 2014-08-11 (Ted Yu via cnauroth) HADOOP-10581. TestUserGroupInformation#testGetServerSideGroups fails - because groups stored in Set and ArrayList are compared. + because groups stored in Set and ArrayList are compared. (Mit Desai via kihwal) HADOOP-10585. Retry polices ignore interrupted exceptions (Daryn Sharp via @@ -1459,7 +1456,7 @@ Release 2.5.0 - 2014-08-11 HADOOP-10622. Shell.runCommand can deadlock (Gera Shegalov via jlowe) - HADOOP-10686. Writables are not always configured. + HADOOP-10686. Writables are not always configured. (Abraham Elmahrek via kasha) HADOOP-10678. SecurityUtil has unnecessary synchronization on collection @@ -1507,7 +1504,7 @@ Release 2.5.0 - 2014-08-11 HADOOP-10715. Remove public GraphiteSink#setWriter (Babak Behzad via raviprak) - HADOOP-10710. hadoop.auth cookie is not properly constructed according to + HADOOP-10710. hadoop.auth cookie is not properly constructed according to RFC2109. (Juan Yu via tucu) HADOOP-10864. Tool documentenation is broken. (Akira Ajisaka @@ -1545,7 +1542,7 @@ Release 2.5.0 - 2014-08-11 HADOOP-10561. Copy command with preserve option should handle Xattrs. 
(Yi Liu via cnauroth) -Release 2.4.1 - 2014-06-23 +Release 2.4.1 - 2014-06-23 INCOMPATIBLE CHANGES @@ -1558,7 +1555,7 @@ Release 2.4.1 - 2014-06-23 OPTIMIZATIONS - BUG FIXES + BUG FIXES HADOOP-10455. When there is an exception, ipc.Server should first check whether it is an terse exception. (szetszwo) @@ -1583,7 +1580,7 @@ Release 2.4.1 - 2014-06-23 in AbstractDelegationTokenSecretManager. (Suresh Srinivas via Arpit Agarwal) -Release 2.4.0 - 2014-04-07 +Release 2.4.0 - 2014-04-07 INCOMPATIBLE CHANGES @@ -1600,7 +1597,7 @@ Release 2.4.0 - 2014-04-07 HADOOP-10139. Update and improve the Single Cluster Setup document. (Akira Ajisaka via Arpit Agarwal) - HADOOP-10295. Allow distcp to automatically identify the checksum type of + HADOOP-10295. Allow distcp to automatically identify the checksum type of source files and use it for the target. (jing9 and Laurent Goujon) HADOOP-10333. Fix grammatical error in overview.html document. @@ -1645,7 +1642,7 @@ Release 2.4.0 - 2014-04-07 HADOOP-10015. UserGroupInformation prints out excessive warnings. (Nicolas Liochon via szetszwo) - HADOOP-10423. Clarify compatibility policy document for combination of + HADOOP-10423. Clarify compatibility policy document for combination of new client and old server. (Chris Nauroth via kasha) HADOOP-10280. Make Schedulables return a configurable identity of user @@ -1657,8 +1654,8 @@ Release 2.4.0 - 2014-04-07 HADOOP-10320. Javadoc in InterfaceStability.java lacks final . (René Nyffenegger via cnauroth) - - HADOOP-10085. CompositeService should allow adding services while being + + HADOOP-10085. CompositeService should allow adding services while being inited. (Steve Loughran via kasha) HADOOP-10327. Trunk windows build broken after HDFS-5746. @@ -1697,7 +1694,7 @@ Release 2.4.0 - 2014-04-07 HADOOP-10395. TestCallQueueManager is flaky. (Arpit Agarwal) HADOOP-10394. TestAuthenticationFilter is flaky. 
(Arpit Agarwal) - + HADOOP-10337 ConcurrentModificationException from MetricsDynamicMBeanBase.createMBeanInfo() (Liang Xie via stack) @@ -1782,7 +1779,7 @@ Release 2.3.1 - UNRELEASED OPTIMIZATIONS - BUG FIXES + BUG FIXES Release 2.3.0 - 2014-02-18 @@ -1804,10 +1801,10 @@ Release 2.3.0 - 2014-02-18 HADOOP-9623 Update jets3t dependency to 0.9.0. (Amandeep Khurana via Colin Patrick McCabe) - HADOOP-10132. RPC#stopProxy() should log the class of proxy when IllegalArgumentException + HADOOP-10132. RPC#stopProxy() should log the class of proxy when IllegalArgumentException is encountered (Ted yu via umamahesh) - HADOOP-10248. Property name should be included in the exception where property value + HADOOP-10248. Property name should be included in the exception where property value is null (Akira AJISAKA via umamahesh) HADOOP-10086. User document for authentication in secure cluster. @@ -1837,13 +1834,13 @@ Release 2.3.0 - 2014-02-18 HADOOP-9435. Support building the JNI code against the IBM JVM. (Tian Hong Wang via Colin Patrick McCabe) - HADOOP-9848. Create a MiniKDC for use with security testing. + HADOOP-9848. Create a MiniKDC for use with security testing. (ywskycn via tucu) - HADOOP-9860. Remove class HackedKeytab and HackedKeytabEncoder from + HADOOP-9860. Remove class HackedKeytab and HackedKeytabEncoder from hadoop-minikdc once jira DIRSERVER-1882 solved. (ywskycn via tucu) - HADOOP-9866. convert hadoop-auth testcases requiring kerberos to + HADOOP-9866. convert hadoop-auth testcases requiring kerberos to use minikdc. (ywskycn via tucu) HADOOP-9487 Deprecation warnings in Configuration should go to their @@ -1919,7 +1916,7 @@ Release 2.3.0 - 2014-02-18 HADOOP-10164. Allow UGI to login with a known Subject (bobby) HADOOP-10169. Remove the unnecessary synchronized in JvmMetrics class. - (Liang Xie via jing9) + (Liang Xie via jing9) HADOOP-10198. DomainSocket: add support for socketpair. 
(Colin Patrick McCabe via wang) @@ -1943,7 +1940,7 @@ Release 2.3.0 - 2014-02-18 HADOOP-10317. Rename branch-2.3 release version from 2.4.0-SNAPSHOT to 2.3.0-SNAPSHOT. (wang) - HADOOP-10313. Script and jenkins job to produce Hadoop release artifacts. + HADOOP-10313. Script and jenkins job to produce Hadoop release artifacts. (tucu) OPTIMIZATIONS @@ -1974,7 +1971,7 @@ Release 2.3.0 - 2014-02-18 HADOOP-10031. FsShell -get/copyToLocal/moveFromLocal should support Windows local path. (Chuan Liu via cnauroth) - HADOOP-10039. Add Hive to the list of projects using + HADOOP-10039. Add Hive to the list of projects using AbstractDelegationTokenSecretManager. (Haohui Mai via jing9) HADOOP-10040. hadoop.cmd in UNIX format and would not run by default on @@ -2000,7 +1997,7 @@ Release 2.3.0 - 2014-02-18 HADOOP-10110. hadoop-auth has a build break due to missing dependency. (Chuan Liu via arp) - HADOOP-9114. After defined the dfs.checksum.type as the NULL, write file and hflush will + HADOOP-9114. After defined the dfs.checksum.type as the NULL, write file and hflush will through java.lang.ArrayIndexOutOfBoundsException (Sathish via umamahesh) HADOOP-10130. RawLocalFS::LocalFSFileInputStream.pread does not track @@ -2021,7 +2018,7 @@ Release 2.3.0 - 2014-02-18 HADOOP-10090. Jobtracker metrics not updated properly after execution of a mapreduce job. (ivanmi) - HADOOP-10193. hadoop-auth's PseudoAuthenticationHandler can consume getInputStream. + HADOOP-10193. hadoop-auth's PseudoAuthenticationHandler can consume getInputStream. (gchanan via tucu) HADOOP-10178. Configuration deprecation always emit "deprecated" warnings @@ -2044,7 +2041,7 @@ Release 2.3.0 - 2014-02-18 HADOOP-9830. Fix typo at http://hadoop.apache.org/docs/current/ (Kousuke Saruta via Arpit Agarwal) - HADOOP-10255. Rename HttpServer to HttpServer2 to retain older + HADOOP-10255. Rename HttpServer to HttpServer2 to retain older HttpServer in branch-2 for compatibility. (Haohui Mai via suresh) HADOOP-10291. 
TestSecurityUtil#testSocketAddrWithIP fails due to test @@ -2125,7 +2122,7 @@ Release 2.3.0 - 2014-02-18 HADOOP-10214. Fix multithreaded correctness warnings in ActiveStandbyElector (Liang Xie via kasha) - HADOOP-10223. MiniKdc#main() should close the FileReader it creates. + HADOOP-10223. MiniKdc#main() should close the FileReader it creates. (Ted Yu via tucu) HADOOP-10236. Fix typo in o.a.h.ipc.Client#checkResponse. (Akira Ajisaka @@ -2190,7 +2187,7 @@ Release 2.2.0 - 2013-10-13 HADOOP-10003. HarFileSystem.listLocatedStatus() fails. (Jason Dere and suresh via suresh) - HADOOP-10017. Fix NPE in DFSClient#getDelegationToken when doing Distcp + HADOOP-10017. Fix NPE in DFSClient#getDelegationToken when doing Distcp from a secured cluster to an insecured cluster. (Haohui Mai via jing9) Release 2.1.1-beta - 2013-09-23 @@ -2198,7 +2195,7 @@ Release 2.1.1-beta - 2013-09-23 INCOMPATIBLE CHANGES HADOOP-9944. Fix RpcRequestHeaderProto.callId to be sint32 rather than - uint32 since ipc.Client.CONNECTION_CONTEXT_CALL_ID is signed (i.e. -3) + uint32 since ipc.Client.CONNECTION_CONTEXT_CALL_ID is signed (i.e. -3) (acmurthy) NEW FEATURES @@ -2209,14 +2206,14 @@ Release 2.1.1-beta - 2013-09-23 (Andre Kelpe via harsh) HADOOP-9446. Support Kerberos SPNEGO for IBM JDK. (Yu Gao via llu) - + HADOOP-9787. ShutdownHelper util to shutdown threads and threadpools. (Karthik Kambatla via Sandy Ryza) HADOOP-9803. Add a generic type parameter to RetryInvocationHandler. (szetszwo) - HADOOP-9821. ClientId should have getMsb/getLsb methods. + HADOOP-9821. ClientId should have getMsb/getLsb methods. (Tsuyoshi OZAWA via jing9) HADOOP-9672. Upgrade Avro dependency to 1.7.4. (sandy via kihwal) @@ -2230,7 +2227,7 @@ Release 2.1.1-beta - 2013-09-23 HADOOP-9879. Move the version info of zookeeper dependencies to hadoop-project/pom (Karthik Kambatla via Sandy Ryza) - + HADOOP-9886. Turn warning message in RetryInvocationHandler to debug (arpit) HADOOP-9906. 
Move HAZKUtil to o.a.h.util.ZKUtil and make inner-classes @@ -2242,7 +2239,7 @@ Release 2.1.1-beta - 2013-09-23 HADOOP-9945. HAServiceState should have a state for stopped services. (Karthik Kambatla via atm) - HADOOP-9962. in order to avoid dependency divergence within Hadoop itself + HADOOP-9962. in order to avoid dependency divergence within Hadoop itself lets enable DependencyConvergence. (rvs via tucu) HADOOP-9669. Reduce the number of byte array creations and copies in @@ -2305,7 +2302,7 @@ Release 2.1.1-beta - 2013-09-23 HADOOP-9557. hadoop-client excludes commons-httpclient. (Lohit Vijayarenu via cnauroth) - HADOOP-9961. versions of a few transitive dependencies diverged between hadoop + HADOOP-9961. versions of a few transitive dependencies diverged between hadoop subprojects. (rvs via tucu) HADOOP-9977. Hadoop services won't start with different keypass and @@ -2351,7 +2348,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9283. Add support for running the Hadoop client on AIX. (atm) - HADOOP-8415. Add getDouble() and setDouble() in + HADOOP-8415. Add getDouble() and setDouble() in org.apache.hadoop.conf.Configuration (Jan van der Lugt via harsh) HADOOP-9338. FsShell Copy Commands Should Optionally Preserve File @@ -2367,13 +2364,13 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-8470. Add NetworkTopologyWithNodeGroup, a 4-layer implementation of NetworkTopology. (Junping Du via szetszwo) - HADOOP-9763. Extends LightWeightGSet to support eviction of expired + HADOOP-9763. Extends LightWeightGSet to support eviction of expired elements. (Tsz Wo (Nicholas) SZE via jing9) - HADOOP-9762. RetryCache utility for implementing RPC retries. + HADOOP-9762. RetryCache utility for implementing RPC retries. (Suresh Srinivas via jing9) - HADOOP-9792. Retry the methods that are tagged @AtMostOnce along + HADOOP-9792. Retry the methods that are tagged @AtMostOnce along with @Idempotent. (suresh) HADOOP-9509. Implement ONCRPC and XDR. 
(brandonli) @@ -2405,7 +2402,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9358. "Auth failed" log should include exception string (todd) - HADOOP-9401. CodecPool: Add counters for number of (de)compressors + HADOOP-9401. CodecPool: Add counters for number of (de)compressors leased out. (kkambatl via tucu) HADOOP-9450. HADOOP_USER_CLASSPATH_FIRST is not honored; CLASSPATH @@ -2441,7 +2438,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9604. Javadoc of FSDataOutputStream is slightly inaccurate. (Jingguo Yao via atm) - + HADOOP-9625. HADOOP_OPTS not picked up by hadoop command. (Paul Han via arpit) @@ -2503,7 +2500,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9770. Make RetryCache#state non volatile. (suresh) - HADOOP-9786. RetryInvocationHandler#isRpcInvocation should support + HADOOP-9786. RetryInvocationHandler#isRpcInvocation should support ProtocolTranslator. (suresh and jing9) OPTIMIZATIONS @@ -2550,10 +2547,10 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9342. Remove jline from distribution. (thw via tucu) - HADOOP-9230. TestUniformSizeInputFormat fails intermittently. + HADOOP-9230. TestUniformSizeInputFormat fails intermittently. (kkambatl via tucu) - HADOOP-9349. Confusing output when running hadoop version from one hadoop + HADOOP-9349. Confusing output when running hadoop version from one hadoop installation when HADOOP_HOME points to another. (sandyr via tucu) HADOOP-9337. org.apache.hadoop.fs.DF.getMount() does not work on Mac OS. @@ -2562,7 +2559,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9369. DNS#reverseDns() can return hostname with . appended at the end. (Karthik Kambatla via atm) - HADOOP-9379. capture the ulimit info after printing the log to the + HADOOP-9379. capture the ulimit info after printing the log to the console. (Arpit Gupta via suresh) HADOOP-9399. protoc maven plugin doesn't work on mvn 3.0.2 (todd) @@ -2581,7 +2578,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9429. TestConfiguration fails with IBM JAVA. 
(Amir Sanjar via suresh) - HADOOP-9222. Cover package with org.apache.hadoop.io.lz4 unit tests (Vadim + HADOOP-9222. Cover package with org.apache.hadoop.io.lz4 unit tests (Vadim Bondarev via jlowe) HADOOP-9233. Cover package org.apache.hadoop.io.compress.zlib with unit @@ -2680,12 +2677,12 @@ Release 2.1.0-beta - 2013-08-22 (Bikas Saha, Chuan Liu, Giridharan Kesavan, Ivan Mitic, and Steve Maine ported by Chris Nauroth via suresh) - HADOOP-8946. winutils: compile codebase during Maven build on + HADOOP-8946. winutils: compile codebase during Maven build on branch-trunk-win. (Chris Nauroth via suresh) - HADOOP-8947. Merge FileUtil and Shell changes from branch-1-win to - branch-trunk-win to enable initial test pass. (Raja Aluri, Davio Lao, - Sumadhur Reddy Bolli, Ahmed El Baz, Kanna Karanam, Chuan Liu, + HADOOP-8947. Merge FileUtil and Shell changes from branch-1-win to + branch-trunk-win to enable initial test pass. (Raja Aluri, Davio Lao, + Sumadhur Reddy Bolli, Ahmed El Baz, Kanna Karanam, Chuan Liu, Ivan Mitic, Chris Nauroth, and Bikas Saha via suresh) HADOOP-8954. "stat" executable not found on Windows. (Bikas Saha, Ivan Mitic @@ -2702,7 +2699,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-8961. GenericOptionsParser URI parsing failure on Windows. (Ivan Mitic via suresh) - HADOOP-8949. Remove FileUtil.CygPathCommand dead code. (Chris Nauroth via + HADOOP-8949. Remove FileUtil.CygPathCommand dead code. (Chris Nauroth via suresh) HADOOP-8956. FileSystem.primitiveMkdir failures on Windows cause multiple @@ -2721,7 +2718,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-8977. Multiple FsShell test failures on Windows. (Chris Nauroth via suresh) - HADOOP-9005. Merge hadoop cmd line scripts from branch-1-win. (David Lao, + HADOOP-9005. Merge hadoop cmd line scripts from branch-1-win. (David Lao, Bikas Saha, Lauren Yang, Chuan Liu, Thejas M Nair and Ivan Mitic via suresh) HADOOP-9008. Building hadoop tarball fails on Windows. 
(Chris Nauroth via @@ -2730,7 +2727,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9011. saveVersion.py does not include branch in version annotation. (Chris Nauroth via suresh) - HADOOP-9110. winutils ls off-by-one error indexing MONTHS array can cause + HADOOP-9110. winutils ls off-by-one error indexing MONTHS array can cause access violation. (Chris Nauroth via suresh) HADOOP-9056. Build native library on Windows. (Chuan Liu, Arpit Agarwal via @@ -2738,7 +2735,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9144. Fix findbugs warnings. (Chris Nauroth via suresh) - HADOOP-9081. Add TestWinUtils. (Chuan Liu, Ivan Mitic, Chris Nauroth, + HADOOP-9081. Add TestWinUtils. (Chuan Liu, Ivan Mitic, Chris Nauroth, and Bikas Saha via suresh) HADOOP-9146. Fix sticky bit regression on branch-trunk-win. @@ -2812,10 +2809,10 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9290. Some tests cannot load native library on windows. (Chris Nauroth via suresh) - HADOOP-9500. TestUserGroupInformation#testGetServerSideGroups fails on + HADOOP-9500. TestUserGroupInformation#testGetServerSideGroups fails on Windows due to failure to find winutils.exe. (Chris Nauroth via suresh) - HADOOP-9490. LocalFileSystem#reportChecksumFailure not closing the + HADOOP-9490. LocalFileSystem#reportChecksumFailure not closing the checksum file handle before rename. (Ivan Mitic via suresh) HADOOP-9524. Fix ShellCommandFencer to work on Windows. @@ -2832,7 +2829,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9483. winutils support for readlink command. (Arpit Agarwal via suresh) - + HADOOP-9488. FileUtil#createJarWithClassPath only substitutes environment variables from current process environment/does not support overriding when launching new process (Chris Nauroth via bikas) @@ -2854,7 +2851,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-8982. TestSocketIOWithTimeout fails on Windows. (Chris Nauroth via suresh) - HADOOP-8958. ViewFs:Non absolute mount name failures when running + HADOOP-8958. 
ViewFs:Non absolute mount name failures when running multiple tests on Windows. (Chris Nauroth via suresh) HADOOP-9599. hadoop-config.cmd doesn't set JAVA_LIBRARY_PATH correctly. @@ -2863,7 +2860,7 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-9637. Adding Native Fstat for Windows as needed by YARN. (Chuan Liu via cnauroth) - HADOOP-9264. Port change to use Java untar API on Windows from + HADOOP-9264. Port change to use Java untar API on Windows from branch-1-win to trunk. (Chris Nauroth via suresh) HADOOP-9678. TestRPC#testStopsAllThreads intermittently fails on Windows. @@ -2878,8 +2875,8 @@ Release 2.1.0-beta - 2013-08-22 HADOOP-8440. HarFileSystem.decodeHarURI fails for URIs whose host contains numbers. (Ivan Mitic via cnauroth) - HADOOP-9643. org.apache.hadoop.security.SecurityUtil calls - toUpperCase(Locale.getDefault()) as well as toLowerCase(Locale.getDefault()) + HADOOP-9643. org.apache.hadoop.security.SecurityUtil calls + toUpperCase(Locale.getDefault()) as well as toLowerCase(Locale.getDefault()) on hadoop.security.authentication value. (markrmiller@gmail.com via tucu) HADOOP-9701. mvn site ambiguous links in hadoop-common. (kkambatl via tucu) @@ -2940,10 +2937,10 @@ Release 2.0.4-alpha - 2013-04-25 HADOOP-9444. Modify hadoop-policy.xml to replace unexpanded variables to a default value of '*'. (Roman Shaposhnik via vinodkv) - HADOOP-9471. hadoop-client wrongfully excludes jetty-util JAR, + HADOOP-9471. hadoop-client wrongfully excludes jetty-util JAR, breaking webhdfs. (tucu) -Release 2.0.3-alpha - 2013-02-06 +Release 2.0.3-alpha - 2013-02-06 INCOMPATIBLE CHANGES @@ -2962,7 +2959,7 @@ Release 2.0.3-alpha - 2013-02-06 HADOOP-9090. Support on-demand publish of metrics. (Mostafa Elhemali via suresh) - HADOOP-9054. Add AuthenticationHandler that uses Kerberos but allows for + HADOOP-9054. Add AuthenticationHandler that uses Kerberos but allows for an alternate form of authentication for browsers. 
(rkanter via tucu) IMPROVEMENTS @@ -3016,7 +3013,7 @@ Release 2.0.3-alpha - 2013-02-06 HADOOP-8925. Remove the packaging. (eli) - HADOOP-8985. Add namespace declarations in .proto files for languages + HADOOP-8985. Add namespace declarations in .proto files for languages other than java. (Binglin Chan via suresh) HADOOP-9009. Add SecurityUtil methods to get/set authentication method @@ -3131,10 +3128,10 @@ Release 2.0.3-alpha - 2013-02-06 HADOOP-8881. FileBasedKeyStoresFactory initialization logging should be debug not info. (tucu) - HADOOP-8913. hadoop-metrics2.properties should give units in comment + HADOOP-8913. hadoop-metrics2.properties should give units in comment for sampling period. (Sandy Ryza via suresh) - HADOOP-8878. Uppercase namenode hostname causes hadoop dfs calls with + HADOOP-8878. Uppercase namenode hostname causes hadoop dfs calls with webhdfs filesystem and fsck to fail when security is on. (Arpit Gupta via suresh) @@ -3150,7 +3147,7 @@ Release 2.0.3-alpha - 2013-02-06 HADOOP-8948. TestFileUtil.testGetDU fails on Windows due to incorrect assumption of line separator. (Chris Nauroth via suresh) - HADOOP-8951. RunJar to fail with user-comprehensible error + HADOOP-8951. RunJar to fail with user-comprehensible error message if jar missing. (stevel via suresh) HADOOP-8713. TestRPCCompatibility fails intermittently with JDK7 @@ -3165,7 +3162,7 @@ Release 2.0.3-alpha - 2013-02-06 HADOOP-9049. DelegationTokenRenewer needs to be Singleton and FileSystems should register/deregister to/from. (Karthik Kambatla via tomwhite) - HADOOP-9064. Augment DelegationTokenRenewer API to cancel the tokens on + HADOOP-9064. Augment DelegationTokenRenewer API to cancel the tokens on calls to removeRenewAction. (kkambatl via tucu) HADOOP-9103. UTF8 class does not properly decode Unicode characters @@ -3205,9 +3202,9 @@ Release 2.0.3-alpha - 2013-02-06 HADOOP-9178. src/main/conf is missing hadoop-policy.xml. (Sandy Ryza via eli) - HADOOP-8816. 
HTTP Error 413 full HEAD if using kerberos authentication. + HADOOP-8816. HTTP Error 413 full HEAD if using kerberos authentication. (moritzmoeller via tucu) - + HADOOP-9212. Potential deadlock in FileSystem.Cache/IPC/UGI. (tomwhite) HADOOP-8589 ViewFs tests fail when tests and home dirs are nested. @@ -3219,7 +3216,7 @@ Release 2.0.3-alpha - 2013-02-06 HADOOP-9215. when using cmake-2.6, libhadoop.so doesn't get created (only libhadoop.so.1.0.0) (Colin Patrick McCabe via todd) - HADOOP-8857. hadoop.http.authentication.signature.secret.file docs + HADOOP-8857. hadoop.http.authentication.signature.secret.file docs should not state that secret is randomly generated. (tucu) HADOOP-9190. packaging docs is broken. (Andy Isaacson via tgraves) @@ -3227,7 +3224,7 @@ Release 2.0.3-alpha - 2013-02-06 HADOOP-9221. Convert remaining xdocs to APT. (Andy Isaacson via atm) HADOOP-8981. TestMetricsSystemImpl fails on Windows. (Xuan Gong via suresh) - + HADOOP-9124. SortedMapWritable violates contract of Map interface for equals() and hashCode(). (Surenkumar Nihalani via tomwhite) @@ -3243,7 +3240,7 @@ Release 2.0.3-alpha - 2013-02-06 HADOOP-9289. FsShell rm -f fails for non-matching globs. (Daryn Sharp via suresh) -Release 2.0.2-alpha - 2012-09-07 +Release 2.0.2-alpha - 2012-09-07 INCOMPATIBLE CHANGES @@ -3253,18 +3250,18 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8689. Make trash a server side configuration option. (eli) HADOOP-8710. Remove ability for users to easily run the trash emptire. (eli) - + HADOOP-8794. Rename YARN_HOME to HADOOP_YARN_HOME. (vinodkv via acmurthy) NEW FEATURES - + HDFS-3042. Automatic failover support for NameNode HA (todd) (see dedicated section below for breakdown of subtasks) HADOOP-8135. Add ByteBufferReadable interface to FSDataInputStream. (Henry Robinson via atm) - HADOOP-8458. Add management hook to AuthenticationHandler to enable + HADOOP-8458. 
Add management hook to AuthenticationHandler to enable delegation token operations support (tucu) HADOOP-8465. hadoop-auth should support ephemeral authentication (tucu) @@ -3273,7 +3270,7 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8581. add support for HTTPS to the web UIs. (tucu) - HADOOP-7754. Expose file descriptors from Hadoop-wrapped local + HADOOP-7754. Expose file descriptors from Hadoop-wrapped local FileSystems (todd and ahmed via tucu) HADOOP-8240. Add a new API to allow users to specify a checksum type @@ -3375,14 +3372,14 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8801. ExitUtil#terminate should capture the exception stack trace. (eli) - HADOOP-8819. Incorrectly & is used instead of && in some file system + HADOOP-8819. Incorrectly & is used instead of && in some file system implementations. (Brandon Li via suresh) - HADOOP-7808. Port HADOOP-7510 - Add configurable option to use original - hostname in token instead of IP to allow server IP change. + HADOOP-7808. Port HADOOP-7510 - Add configurable option to use original + hostname in token instead of IP to allow server IP change. (Daryn Sharp via suresh) - HADOOP-8367 Improve documentation of declaringClassProtocolName in + HADOOP-8367 Improve documentation of declaringClassProtocolName in rpc headers. (Sanjay Radia) HADOOP-8624. ProtobufRpcEngine should log all RPCs if TRACE logging is @@ -3393,12 +3390,12 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8372. NetUtils.normalizeHostName() incorrectly handles hostname starting with a numeric character. (Junping Du via suresh) - HADOOP-8393. hadoop-config.sh missing variable exports, causes Yarn jobs + HADOOP-8393. hadoop-config.sh missing variable exports, causes Yarn jobs to fail with ClassNotFoundException MRAppMaster. (phunt via tucu) HADOOP-8316. Audit logging should be disabled by default. (eli) - HADOOP-8400. All commands warn "Kerberos krb5 configuration not found" + HADOOP-8400. 
All commands warn "Kerberos krb5 configuration not found" when security is not enabled. (tucu) HADOOP-8406. CompressionCodecFactory.CODEC_PROVIDERS iteration is @@ -3418,10 +3415,10 @@ Release 2.0.2-alpha - 2012-09-07 FileContextMainOperationsBaseTest.java to avoid potential test failure (Madhukara Phatak via harsh) - HADOOP-8452. DN logs backtrace when running under jsvc and /jmx is loaded + HADOOP-8452. DN logs backtrace when running under jsvc and /jmx is loaded (Andy Isaacson via bobby) - HADOOP-8460. Document proper setting of HADOOP_PID_DIR and + HADOOP-8460. Document proper setting of HADOOP_PID_DIR and HADOOP_SECURE_DN_PID_DIR (bobby) HADOOP-8466. hadoop-client POM incorrectly excludes avro. (bmahe via tucu) @@ -3442,10 +3439,10 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8509. JarFinder duplicate entry: META-INF/MANIFEST.MF exception (tucu) - HADOOP-8512. AuthenticatedURL should reset the Token when the server returns + HADOOP-8512. AuthenticatedURL should reset the Token when the server returns other than OK on authentication (tucu) - HADOOP-8168. empty-string owners or groups causes {{MissingFormatWidthException}} + HADOOP-8168. empty-string owners or groups causes {{MissingFormatWidthException}} in o.a.h.fs.shell.Ls.ProcessPath() (ekoontz via tucu) HADOOP-8438. hadoop-validate-setup.sh refers to examples jar file which doesn't exist @@ -3459,7 +3456,7 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8563. don't package hadoop-pipes examples/bin (Colin Patrick McCabe via tgraves) - HADOOP-8566. AvroReflectSerializer.accept(Class) throws a NPE if the class has no + HADOOP-8566. AvroReflectSerializer.accept(Class) throws a NPE if the class has no package (primitive types and arrays). (tucu) HADOOP-8586. Fixup a bunch of SPNEGO misspellings. (eli) @@ -3472,7 +3469,7 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8585. Fix initialization circularity between UserGroupInformation and HadoopConfiguration. (Colin Patrick McCabe via atm) - HADOOP-8552. 
Conflict: Same security.log.file for multiple users. + HADOOP-8552. Conflict: Same security.log.file for multiple users. (kkambatl via tucu) HADOOP-8537. Fix TFile tests to pass even when native zlib support is not @@ -3491,7 +3488,7 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8654. TextInputFormat delimiter bug (Gelesh and Jason Lowe via bobby) - HADOOP-8614. IOUtils#skipFully hangs forever on EOF. + HADOOP-8614. IOUtils#skipFully hangs forever on EOF. (Colin Patrick McCabe via eli) HADOOP-8720. TestLocalFileSystem should use test root subdirectory. @@ -3502,7 +3499,7 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8632. Configuration leaking class-loaders (Costin Leau via bobby) - HADOOP-4572. Can not access user logs - Jetty is not configured by default + HADOOP-4572. Can not access user logs - Jetty is not configured by default to serve aliases/symlinks (ahmed via tucu) HADOOP-8660. TestPseudoAuthenticator failing with NPE. (tucu) @@ -3510,7 +3507,7 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8699. some common testcases create core-site.xml in test-classes making other testcases to fail. (tucu) - HADOOP-8031. Configuration class fails to find embedded .jar resources; + HADOOP-8031. Configuration class fails to find embedded .jar resources; should use URL.openStream() (genman via tucu) HADOOP-8737. cmake: always use JAVA_HOME to find libjvm.so, jni.h, jni_md.h. @@ -3531,7 +3528,7 @@ Release 2.0.2-alpha - 2012-09-07 HADOOP-8766. FileContextMainOperationsBaseTest should randomize the root dir. (Colin Patrick McCabe via atm) - HADOOP-8749. HADOOP-8031 changed the way in which relative xincludes are handled in + HADOOP-8749. HADOOP-8031 changed the way in which relative xincludes are handled in Configuration. (ahmed via tucu) HADOOP-8431. Running distcp wo args throws IllegalArgumentException. @@ -3548,30 +3545,30 @@ Release 2.0.2-alpha - 2012-09-07 correctly (todd) HADOOP-8228. Auto HA: Refactor tests and add stress tests. (todd) - + HADOOP-8215. 
Security support for ZK Failover controller (todd) - + HADOOP-8245. Fix flakiness in TestZKFailoverController (todd) - + HADOOP-8257. TestZKFailoverControllerStress occasionally fails with Mockito error (todd) - + HADOOP-8260. Replace ClientBaseWithFixes with our own modified copy of the class (todd) - + HADOOP-8246. Auto-HA: automatically scope znode by nameservice ID (todd) - + HADOOP-8247. Add a config to enable auto-HA, which disables manual FailoverController (todd) - + HADOOP-8306. ZKFC: improve error message when ZK is not running. (todd) - + HADOOP-8279. Allow manual failover to be invoked when auto-failover is enabled. (todd) - + HADOOP-8276. Auto-HA: add config for java options to pass to zkfc daemon (todd via eli) - + HADOOP-8405. ZKFC tests leak ZK instances. (todd) Release 2.0.0-alpha - 05-23-2012 @@ -3604,7 +3601,7 @@ Release 2.0.0-alpha - 05-23-2012 HADOOP-8210. Common side of HDFS-3148: The client should be able to use multiple local interfaces for data transfer. (eli) - HADOOP-8343. Allow configuration of authorization for JmxJsonServlet and + HADOOP-8343. Allow configuration of authorization for JmxJsonServlet and MetricsServlet (tucu) IMPROVEMENTS @@ -3633,20 +3630,20 @@ Release 2.0.0-alpha - 05-23-2012 HADOOP-7899. Generate proto java files as part of the build. (tucu) - HADOOP-7957. Classes deriving GetGroupsBase should be able to override + HADOOP-7957. Classes deriving GetGroupsBase should be able to override proxy creation. (jitendra) HADOOP-7965. Support for protocol version and signature in PB. (jitendra) HADOOP-8070. Add a standalone benchmark for RPC call performance. (todd) - HADOOP-8084. Updates ProtoBufRpc engine to not do an unnecessary copy + HADOOP-8084. Updates ProtoBufRpc engine to not do an unnecessary copy for RPC request/response. (ddas) HADOOP-8085. Add RPC metrics to ProtobufRpcEngine. (Hari Mankude via suresh) - HADOOP-8098. KerberosAuthenticatorHandler should use _HOST replacement to + HADOOP-8098. 
KerberosAuthenticatorHandler should use _HOST replacement to resolve principal name (tucu) HADOOP-8118. In metrics2.util.MBeans, change log level to trace for the @@ -3668,14 +3665,14 @@ Release 2.0.0-alpha - 05-23-2012 HADOOP-7806. Support binding to sub-interfaces (eli) - HADOOP-6941. Adds support for building Hadoop with IBM's JDK + HADOOP-6941. Adds support for building Hadoop with IBM's JDK (Stephen Watt, Eli and ddas) HADOOP-8183. Stop using "mapred.used.genericoptions.parser" (harsh) HADOOP-6924. Adds a directory to the list of directories to search for the libjvm.so file. The new directory is found by running a 'find' - command and the first output is taken. This was done to handle the + command and the first output is taken. This was done to handle the build of Hadoop with IBM's JDK. (Stephen Watt, Guillermo Cabrera and ddas) HADOOP-8200. Remove HADOOP_[JOBTRACKER|TASKTRACKER]_OPTS. (eli) @@ -3711,7 +3708,7 @@ Release 2.0.0-alpha - 05-23-2012 HADOOP-8077. HA: fencing method should be able to be configured on a per-NN or per-NS basis (todd) - HADOOP-8086. KerberosName silently sets defaultRealm to "" if the + HADOOP-8086. KerberosName silently sets defaultRealm to "" if the Kerberos config is not found, it should log a WARN (tucu) HADOOP-8280. Move VersionUtil/TestVersionUtil and GenericTestUtils from @@ -3734,7 +3731,7 @@ Release 2.0.0-alpha - 05-23-2012 HADOOP-8350. Improve NetUtils.getInputStream to return a stream which has a tunable timeout. (todd) - HADOOP-8356. FileSystem service loading mechanism should print the FileSystem + HADOOP-8356. FileSystem service loading mechanism should print the FileSystem impl it is failing to load (tucu) HADOOP-8353. hadoop-daemon.sh and yarn-daemon.sh can be misleading on stop. @@ -3752,7 +3749,7 @@ Release 2.0.0-alpha - 05-23-2012 HADOOP-7987. Support setting the run-as user in unsecure mode. (jitendra) - HADOOP-7994. Remove getProtocolVersion and getProtocolSignature from the + HADOOP-7994. 
Remove getProtocolVersion and getProtocolSignature from the client side translator and server side implementation. (jitendra) OPTIMIZATIONS @@ -3760,7 +3757,7 @@ Release 2.0.0-alpha - 05-23-2012 BUG FIXES HADOOP-8199. Fix issues in start-all.sh and stop-all.sh (Devaraj K via umamahesh) - + HADOOP-7635. RetryInvocationHandler should release underlying resources on close. (atm) @@ -3827,7 +3824,7 @@ Release 2.0.0-alpha - 05-23-2012 HADOOP-8251. Fix SecurityUtil.fetchServiceTicket after HADOOP-6941 (todd) - HADOOP-8249. invalid hadoop-auth cookies should trigger authentication + HADOOP-8249. invalid hadoop-auth cookies should trigger authentication if info is avail before returning HTTP 401 (tucu) HADOOP-8261. Har file system doesn't deal with FS URIs with a host but no @@ -3854,10 +3851,10 @@ Release 2.0.0-alpha - 05-23-2012 HADOOP-8284. clover integration broken, also mapreduce poms are pulling in clover as a dependency. (phunt via tucu) - HADOOP-8309. Pseudo & Kerberos AuthenticationHandler should use + HADOOP-8309. Pseudo & Kerberos AuthenticationHandler should use getType() to create token (tucu) - HADOOP-8314. HttpServer#hasAdminAccess should return false if + HADOOP-8314. HttpServer#hasAdminAccess should return false if authorization is enabled but user is not authenticated. (tucu) HADOOP-8296. hadoop/yarn daemonlog usage wrong (Devaraj K via tgraves) @@ -3872,7 +3869,7 @@ Release 2.0.0-alpha - 05-23-2012 HADOOP-8275. Range check DelegationKey length. (Colin Patrick McCabe via eli) - HADOOP-8342. HDFS command fails with exception following merge of + HADOOP-8342. HDFS command fails with exception following merge of HADOOP-8325 (tucu) HADOOP-8346. Makes oid changes to make SPNEGO work. Was broken due @@ -3894,66 +3891,66 @@ Release 2.0.0-alpha - 05-23-2012 BREAKDOWN OF HADOOP-7454 SUBTASKS HADOOP-7455. HA: Introduce HA Service Protocol Interface. (suresh) - + HADOOP-7774. HA: Administrative CLI to control HA daemons. (todd) - + HADOOP-7896. 
HA: if both NNs are in Standby mode, client needs to try failing back and forth several times with sleeps. (atm) - + HADOOP-7922. Improve some logging for client IPC failovers and StandbyExceptions (todd) - + HADOOP-7921. StandbyException should extend IOException (todd) - + HADOOP-7928. HA: Client failover policy is incorrectly trying to fail over all IOExceptions (atm) - + HADOOP-7925. Add interface and update CLI to query current state to HAServiceProtocol (eli via todd) - + HADOOP-7932. Make client connection retries on socket time outs configurable. (Uma Maheswara Rao G via todd) - + HADOOP-7924. FailoverController for client-based configuration (eli) - + HADOOP-7961. Move HA fencing to common. (eli) - + HADOOP-7970. HAServiceProtocol methods must throw IOException. (Hari Mankude via suresh). - + HADOOP-7992. Add ZKClient library to facilitate leader election. (Bikas Saha via suresh). - + HADOOP-7983. HA: failover should be able to pass args to fencers. (eli) - + HADOOP-7938. HA: the FailoverController should optionally fence the active during failover. (eli) - + HADOOP-7991. HA: the FailoverController should check the standby is ready before failing over. (eli) - + HADOOP-8038. Add 'ipc.client.connect.max.retries.on.timeouts' entry in core-default.xml file. (Uma Maheswara Rao G via atm) - + HADOOP-8041. Log a warning when a failover is first attempted (todd) - + HADOOP-8068. void methods can swallow exceptions when going through failover path (todd) - + HADOOP-8116. RetriableCommand is using RetryPolicy incorrectly after HADOOP-7896. (atm) HADOOP-8317. Update maven-assembly-plugin to 2.3 - fix build on FreeBSD (Radim Kolar via bobby) - HADOOP-8172. Configuration no longer sets all keys in a deprecated key + HADOOP-8172. Configuration no longer sets all keys in a deprecated key list. (Anupam Seth via bobby) HADOOP-7868. Hadoop native fails to compile when default linker option is -Wl,--as-needed. (Trevor Robinson via eli) HADOOP-8655. 
Fix TextInputFormat for large deliminators. (Gelesh via - bobby) + bobby) HADOOP-7900. LocalDirAllocator confChanged() accesses conf.get() twice (Ravi Gummadi via Uma Maheswara Rao G) @@ -3981,9 +3978,9 @@ Release 0.23.11 - UNRELEASED INCOMPATIBLE CHANGES NEW FEATURES - + IMPROVEMENTS - + OPTIMIZATIONS BUG FIXES @@ -4021,9 +4018,9 @@ Release 0.23.9 - 2013-07-08 INCOMPATIBLE CHANGES NEW FEATURES - + IMPROVEMENTS - + OPTIMIZATIONS BUG FIXES @@ -4046,7 +4043,7 @@ Release 0.23.8 - 2013-06-05 BUG FIXES - HADOOP-9222. Cover package with org.apache.hadoop.io.lz4 unit tests (Vadim + HADOOP-9222. Cover package with org.apache.hadoop.io.lz4 unit tests (Vadim Bondarev via jlowe) HADOOP-9233. Cover package org.apache.hadoop.io.compress.zlib with unit @@ -4102,7 +4099,7 @@ Release 0.23.7 - 2013-04-18 HADOOP-9303. command manual dfsadmin missing entry for restoreFailedStorage option (Andy Isaacson via tgraves) - HADOOP-9339. IPC.Server incorrectly sets UGI auth type (Daryn Sharp via + HADOOP-9339. IPC.Server incorrectly sets UGI auth type (Daryn Sharp via kihwal) Release 0.23.6 - 2013-02-06 @@ -4126,7 +4123,7 @@ Release 0.23.6 - 2013-02-06 BUG FIXES - HADOOP-9072. Hadoop-Common-0.23-Build Fails to build in Jenkins + HADOOP-9072. Hadoop-Common-0.23-Build Fails to build in Jenkins (Robert Parker via tgraves) HADOOP-8992. Enhance unit-test coverage of class HarFileSystem (Ivan A. @@ -4150,7 +4147,7 @@ Release 0.23.5 - 2012-11-28 IMPROVEMENTS - HADOOP-8932. JNI-based user-group mapping modules can be too chatty on + HADOOP-8932. JNI-based user-group mapping modules can be too chatty on lookup failures. (Kihwal Lee via suresh) HADOOP-8930. Cumulative code coverage calculation (Andrey Klochkov via @@ -4268,7 +4265,7 @@ Release 0.23.3 HADOOP-8129. ViewFileSystemTestSetup setupForViewFileSystem is erring (Ahmed Radwan and Ravi Prakash via bobby) - HADOOP-8573. Configuration tries to read from an inputstream resource + HADOOP-8573. 
Configuration tries to read from an inputstream resource multiple times (Robert Evans via tgraves) HADOOP-8599. Non empty response from FileSystem.getFileBlockLocations when @@ -4285,7 +4282,7 @@ Release 0.23.3 HADOOP-8627. FS deleteOnExit may delete the wrong path (daryn via bobby) - HADOOP-8634. Ensure FileSystem#close doesn't squawk for deleteOnExit paths + HADOOP-8634. Ensure FileSystem#close doesn't squawk for deleteOnExit paths (daryn via bobby) HADOOP-8550. hadoop fs -touchz automatically created parent directories @@ -4295,7 +4292,7 @@ Release 0.23.3 HADOOP-8637. FilterFileSystem#setWriteChecksum is broken (daryn via bobby) - HADOOP-8370. Native build failure: javah: class file for + HADOOP-8370. Native build failure: javah: class file for org.apache.hadoop.classification.InterfaceAudience not found (Trevor Robinson via tgraves) @@ -4308,7 +4305,7 @@ Release 0.23.3 HADOOP-8390. TestFileSystemCanonicalization fails with JDK7 (Trevor Robinson via tgraves) - HADOOP-8692. TestLocalDirAllocator fails intermittently with JDK7 + HADOOP-8692. TestLocalDirAllocator fails intermittently with JDK7 (Trevor Robinson via tgraves) HADOOP-8693. TestSecurityUtil fails intermittently with JDK7 (Trevor @@ -4320,8 +4317,8 @@ Release 0.23.3 HADOOP-8695. TestPathData fails intermittently with JDK7 (Trevor Robinson via tgraves) - HADOOP-8611. Allow fall-back to the shell-based implementation when - JNI-based users-group mapping fails (Robert Parker via bobby) + HADOOP-8611. Allow fall-back to the shell-based implementation when + JNI-based users-group mapping fails (Robert Parker via bobby) HADOOP-8225. DistCp fails when invoked by Oozie (daryn via bobby) @@ -4336,16 +4333,16 @@ Release 0.23.3 HADOOP-8727. Gracefully deprecate dfs.umaskmode in 2.x onwards (Harsh J via bobby) -Release 0.23.2 - UNRELEASED +Release 0.23.2 - UNRELEASED INCOMPATIBLE CHANGES - NEW FEATURES - + NEW FEATURES + IMPROVEMENTS HADOOP-8048. 
Allow merging of Credentials (Daryn Sharp via tgraves) - + HADOOP-8032. mvn site:stage-deploy should be able to use the scp protocol to stage documents (Ravi Prakash via tgraves) @@ -4353,7 +4350,7 @@ Release 0.23.2 - UNRELEASED (szetszwo) HADOOP-8137. Added links to CLI manuals to the site. (tgraves via - acmurthy) + acmurthy) OPTIMIZATIONS HADOOP-8071. Avoid an extra packet in client code when nagling is @@ -4365,7 +4362,7 @@ Release 0.23.2 - UNRELEASED BUG FIXES - HADOOP-7660. Maven generated .classpath doesnot includes + HADOOP-7660. Maven generated .classpath doesnot includes "target/generated-test-source/java" as source directory. (Laxman via bobby) @@ -4380,14 +4377,14 @@ Release 0.23.2 - UNRELEASED HADOOP-8055. Hadoop tarball distribution lacks a core-site.xml (harsh) - HADOOP-8052. Hadoop Metrics2 should emit Float.MAX_VALUE (instead of + HADOOP-8052. Hadoop Metrics2 should emit Float.MAX_VALUE (instead of Double.MAX_VALUE) to avoid making Ganglia's gmetad core. (Varun Kapoor via mattf) HADOOP-8074. Small bug in hadoop error message for unknown commands. (Colin Patrick McCabe via eli) - HADOOP-8082 add hadoop-client and hadoop-minicluster to the + HADOOP-8082 add hadoop-client and hadoop-minicluster to the dependency-management section. (tucu) HADOOP-8066 The full docs build intermittently fails (abayer via tucu) @@ -4412,7 +4409,7 @@ Release 0.23.2 - UNRELEASED (Daryn Sharp via bobby) HADOOP-8123. Use java.home rather than env.JAVA_HOME for java in the - project. (Jonathan Eagles via acmurthy) + project. (Jonathan Eagles via acmurthy) HADOOP-8064. Remove unnecessary dependency on w3c.org in document processing (Khiwal Lee via bobby) @@ -4433,13 +4430,13 @@ Release 0.23.2 - UNRELEASED HADOOP-8208. Disallow self failover. 
(eli) -Release 0.23.1 - 2012-02-17 +Release 0.23.1 - 2012-02-17 INCOMPATIBLE CHANGES NEW FEATURES - HADOOP-7777 Implement a base class for DNSToSwitchMapping implementations + HADOOP-7777 Implement a base class for DNSToSwitchMapping implementations that can offer extra topology information. (stevel) HADOOP-7657. Add support for LZ4 compression. (Binglin Chang via todd) @@ -4466,7 +4463,7 @@ Release 0.23.1 - 2012-02-17 HADOOP-7877. Update balancer CLI usage documentation to include the new -policy option. (szetszwo) - HADOOP-6840. Support non-recursive create() in FileSystem and + HADOOP-6840. Support non-recursive create() in FileSystem and SequenceFile.Writer. (jitendra and eli via eli) HADOOP-6886. LocalFileSystem Needs createNonRecursive API. @@ -4483,7 +4480,7 @@ Release 0.23.1 - 2012-02-17 HADOOP-7933. Add a getDelegationTokens api to FileSystem which checks for known tokens in the passed Credentials object. (sseth) - HADOOP-7737. normalize hadoop-mapreduce & hadoop-dist dist/tar build with + HADOOP-7737. normalize hadoop-mapreduce & hadoop-dist dist/tar build with common/hdfs. (tucu) HADOOP-7743. Add Maven profile to create a full source tarball. (tucu) @@ -4509,7 +4506,7 @@ Release 0.23.1 - 2012-02-17 HADOOP-7736. Remove duplicate Path#normalizePath call. (harsh) - HADOOP-7919. Remove the unused hadoop.logfile.* properties from the + HADOOP-7919. Remove the unused hadoop.logfile.* properties from the core-default.xml file. (harsh) HADOOP-7939. Improve Hadoop subcomponent integration in Hadoop 0.23. (rvs via tucu) @@ -4517,7 +4514,7 @@ Release 0.23.1 - 2012-02-17 HADOOP-8002. SecurityUtil acquired token message should be a debug rather than info. (Arpit Gupta via mahadev) - HADOOP-8009. Create hadoop-client and hadoop-minicluster artifacts for downstream + HADOOP-8009. Create hadoop-client and hadoop-minicluster artifacts for downstream projects. (tucu) HADOOP-7470. Move up to Jackson 1.8.8. 
(Enis Soztutar via szetszwo) @@ -4532,7 +4529,7 @@ Release 0.23.1 - 2012-02-17 OPTIMIZATIONS BUG FIXES - + HADOOP-7811. TestUserGroupInformation#testGetServerSideGroups test fails in chroot. (Jonathan Eagles via mahadev) @@ -4541,7 +4538,7 @@ Release 0.23.1 - 2012-02-17 HADOOP-7841. Run tests with non-secure random. (tlipcon) - HADOOP-7851. Configuration.getClasses() never returns the default value. + HADOOP-7851. Configuration.getClasses() never returns the default value. (Uma Maheswara Rao G via amarrk) HADOOP-7787. Make source tarball use conventional name. @@ -4570,13 +4567,13 @@ Release 0.23.1 - 2012-02-17 HADOOP-7837. no NullAppender in the log4j config. (eli) - HADOOP-7948. Shell scripts created by hadoop-dist/pom.xml to build tar do not + HADOOP-7948. Shell scripts created by hadoop-dist/pom.xml to build tar do not properly propagate failure. (cim_michajlomatijkiw via tucu) HADOOP-7949. Updated maxIdleTime default in the code to match core-default.xml (eli) - HADOOP-7853. multiple javax security configurations cause conflicts. + HADOOP-7853. multiple javax security configurations cause conflicts. (daryn via tucu) HDFS-2614. hadoop dist tarball is missing hdfs headers. (tucu) @@ -4586,7 +4583,7 @@ Release 0.23.1 - 2012-02-17 HADOOP-7887. KerberosAuthenticatorHandler is not setting KerberosName name rules from configuration. (tucu) - HADOOP-7902. skipping name rules setting (if already set) should be done + HADOOP-7902. skipping name rules setting (if already set) should be done on UGI initialization only. (tucu) HADOOP-7810. move hadoop archive to core from tools. (tucu) @@ -4607,7 +4604,7 @@ Release 0.23.1 - 2012-02-17 directory. (harsh via eli) HADOOP-7971. Adding back job/pipes/queue commands to bin/hadoop for - backward compatibility. (Prashath Sharma via acmurthy) + backward compatibility. (Prashath Sharma via acmurthy) HADOOP-7982. UserGroupInformation fails to login if thread's context classloader can't load HadoopLoginModule. 
(todd) @@ -4621,7 +4618,7 @@ Release 0.23.1 - 2012-02-17 HADOOP-7997. SequenceFile.createWriter(...createParent...) no longer works on existing file. (Gregory Chanan via eli) - HADOOP-7993. Hadoop ignores old-style config options for enabling compressed + HADOOP-7993. Hadoop ignores old-style config options for enabling compressed output. (Anupam Seth via mahadev) HADOOP-8000. fetchdt command not available in bin/hadoop. @@ -4638,7 +4635,7 @@ Release 0.23.1 - 2012-02-17 HADOOP-8054 NPE with FilterFileSystem (Daryn Sharp via bobby) -Release 0.23.0 - 2011-11-01 +Release 0.23.0 - 2011-11-01 INCOMPATIBLE CHANGES @@ -4670,7 +4667,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7257 Client side mount tables (sanjay) - HADOOP-6919. New metrics2 framework. (Luke Lu via acmurthy) + HADOOP-6919. New metrics2 framework. (Luke Lu via acmurthy) HADOOP-6920. Metrics instrumentation to move new metrics2 framework. (Luke Lu via suresh) @@ -4882,7 +4879,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7384. Allow test-patch to be more flexible about patch format. (todd) - HADOOP-6929. RPC should have a way to pass Security information other than + HADOOP-6929. RPC should have a way to pass Security information other than protocol annotations. (sharad and omalley via mahadev) HADOOP-7385. Remove StringUtils.stringifyException(ie) in logger functions. @@ -4895,14 +4892,14 @@ Release 0.23.0 - 2011-11-01 HADOOP-7451. Generalize StringUtils#join. (Chris Douglas via mattf) - HADOOP-7449. Add Data(In,Out)putByteBuffer to work with ByteBuffer similar + HADOOP-7449. Add Data(In,Out)putByteBuffer to work with ByteBuffer similar to Data(In,Out)putBuffer for byte[]. Merge from yahoo-merge branch, -r 1079163. Fix missing Apache license headers. (Chris Douglas via mattf) HADOOP-7361. Provide an option, -overwrite/-f, in put and copyFromLocal shell commands. (Uma Maheswara Rao G via szetszwo) - HADOOP-7430. Improve error message when moving to trash fails due to + HADOOP-7430. 
Improve error message when moving to trash fails due to quota issue. (Ravi Prakash via mattf) HADOOP-7444. Add Checksum API to verify and calculate checksums "in bulk" @@ -4912,7 +4909,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7305. Eclipse project files are incomplete. (Niels Basjes via eli) - HADOOP-7314. Add support for throwing UnknownHostException when a host doesn't + HADOOP-7314. Add support for throwing UnknownHostException when a host doesn't resolve. (Jeffrey Naisbitt via jitendra) HADOOP-7465. A several tiny improvements for the LOG format. @@ -4954,7 +4951,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7472. RPC client should deal with IP address change. (Kihwal Lee via suresh) - + HADOOP-7499. Add method for doing a sanity check on hostnames in NetUtils. (Jeffrey Naisbit via mahadev) @@ -4992,7 +4989,7 @@ Release 0.23.0 - 2011-11-01 in the throws clause. (eli) HADOOP-7580. Add a version of getLocalPathForWrite to LocalDirAllocator - which doesn't create dirs. (Chris Douglas & Siddharth Seth via acmurthy) + which doesn't create dirs. (Chris Douglas & Siddharth Seth via acmurthy) HADOOP-7507. Allow ganglia metrics to include the metrics system tags in the gmetric names. (Alejandro Abdelnur via todd) @@ -5013,7 +5010,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7469 Add a standard handler for socket connection problems which improves diagnostics (Uma Maheswara Rao G and stevel via stevel) - HADOOP-7710. Added hadoop-setup-application.sh for creating + HADOOP-7710. Added hadoop-setup-application.sh for creating application directory (Arpit Gupta via Eric Yang) HADOOP-7707. Added toggle for dfs.support.append, webhdfs and hadoop proxy @@ -5030,7 +5027,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7642. create hadoop-dist module where TAR stitching would happen. (Thomas White via tucu) - HADOOP-7709. Running a set of methods in a Single Test Class. + HADOOP-7709. Running a set of methods in a Single Test Class. (Jonathan Eagles via mahadev) HADOOP-7705. 
Add a log4j back end that can push out JSON data, @@ -5041,10 +5038,10 @@ Release 0.23.0 - 2011-11-01 HADOOP-7762. Common side of MR-2736. (eli) - HADOOP-7668. Add a NetUtils method that can tell if an InetAddress + HADOOP-7668. Add a NetUtils method that can tell if an InetAddress belongs to local host. (suresh) - HADOOP-7509. Improve exception message thrown when Authentication is + HADOOP-7509. Improve exception message thrown when Authentication is required. (Ravi Prakash via suresh) HADOOP-7745. Fix wrong variable name in exception message introduced @@ -5061,10 +5058,10 @@ Release 0.23.0 - 2011-11-01 HADOOP-7782. Aggregate project javadocs. (tomwhite) - HADOOP-7789. Improvements to site navigation. (acmurthy) + HADOOP-7789. Improvements to site navigation. (acmurthy) OPTIMIZATIONS - + HADOOP-7333. Performance improvement in PureJavaCrc32. (Eric Caspole via todd) @@ -5085,7 +5082,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7740. Fixed security audit logger configuration. (Arpit Gupta via Eric Yang) - HADOOP-7630. hadoop-metrics2.properties should have a property *.period + HADOOP-7630. hadoop-metrics2.properties should have a property *.period set to a default value for metrics. (Eric Yang via mattf) HADOOP-7327. FileSystem.listStatus() throws NullPointerException instead of @@ -5095,7 +5092,7 @@ Release 0.23.0 - 2011-11-01 whose entries are changing (e.g. in a multi-thread or multi-process environment). (Sanjay Radia via eli) - HADOOP-7045. TestDU fails on systems with local file systems with + HADOOP-7045. TestDU fails on systems with local file systems with extended attributes. (eli) HADOOP-6939. Inconsistent lock ordering in @@ -5121,13 +5118,13 @@ Release 0.23.0 - 2011-11-01 HADOOP-6912. Guard against NPE when calling UGI.isLoginKeytabBased(). (Kan Zhang via jitendra) - HADOOP-7204. remove local unused fs variable from CmdHandler + HADOOP-7204. remove local unused fs variable from CmdHandler and FsShellPermissions.changePermissions (boryas) HADOOP-7210. 
Chown command is not working from FSShell (Uma Maheswara Rao G via todd) - HADOOP-7215. RPC clients must use network interface corresponding to + HADOOP-7215. RPC clients must use network interface corresponding to the host in the client's kerberos principal key. (suresh) HADOOP-7019. Refactor build targets to enable faster cross project dev @@ -5148,7 +5145,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7268. FileContext.getLocalFSFileContext() behavior needs to be fixed w.r.t tokens. (jitendra) - HADOOP-7290. Unit test failure in + HADOOP-7290. Unit test failure in TestUserGroupInformation.testGetServerSideGroups. (Trevor Robison via eli) HADOOP-7292. Fix racy test case TestSinkQueue. (Luke Lu via todd) @@ -5159,7 +5156,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7208. Fix implementation of equals() and hashCode() in StandardSocketFactory. (Uma Maheswara Rao G via todd) - HADOOP-7336. TestFileContextResolveAfs will fail with default + HADOOP-7336. TestFileContextResolveAfs will fail with default test.build.data property. (jitendra) HADOOP-7284 Trash and shell's rm does not work for viewfs (Sanjay Radia) @@ -5199,7 +5196,7 @@ Release 0.23.0 - 2011-11-01 HADOOP_CONF_DIR correctly. (Bing Zheng and todd via todd) HADOOP-7448. merge from yahoo-merge branch (via mattf): - -r 1079157: Fix content type for /stacks servlet to be + -r 1079157: Fix content type for /stacks servlet to be plain text (Luke Lu) -r 1079164: No need to escape plain text (Luke Lu) @@ -5220,7 +5217,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7508. Compiled nativelib is in wrong directory and it is not picked up by surefire setup. (Alejandro Abdelnur via tomwhite) - + HADOOP-7520. Fix to add distribution management info to hadoop-main (Alejandro Abdelnur via gkesavan) @@ -5259,7 +5256,7 @@ Release 0.23.0 - 2011-11-01 (Alejandro Abdelnur via tomwhite) HADOOP-7563. Setup HADOOP_HDFS_HOME, HADOOP_MAPRED_HOME and classpath - correction. (Eric Yang via acmurthy) + correction. (Eric Yang via acmurthy) HADOOP-7560. 
Change src layout to be heirarchical. (Alejandro Abdelnur via acmurthy) @@ -5271,7 +5268,7 @@ Release 0.23.0 - 2011-11-01 (Uma Maheswara Rao G via szetszwo) HADOOP-7598. Fix smart-apply-patch.sh to handle patching from a sub - directory correctly. (Robert Evans via acmurthy) + directory correctly. (Robert Evans via acmurthy) HADOOP-7328. When a serializer class is missing, return null, not throw an NPE. (Harsh J Chouraria via todd) @@ -5298,10 +5295,10 @@ Release 0.23.0 - 2011-11-01 HADOOP-7691. Fixed conflict uid for install packages. (Eric Yang) - HADOOP-7603. Set hdfs, mapred uid, and hadoop uid to fixed numbers. + HADOOP-7603. Set hdfs, mapred uid, and hadoop uid to fixed numbers. (Eric Yang) - HADOOP-7658. Fixed HADOOP_SECURE_DN_USER environment variable in + HADOOP-7658. Fixed HADOOP_SECURE_DN_USER environment variable in hadoop-evn.sh (Eric Yang) HADOOP-7684. Added init.d script for jobhistory server and @@ -5309,7 +5306,7 @@ Release 0.23.0 - 2011-11-01 HADOOP-7715. Removed unnecessary security logger configuration. (Eric Yang) - HADOOP-7685. Improved directory ownership check function in + HADOOP-7685. Improved directory ownership check function in hadoop-setup-conf.sh. (Eric Yang) HADOOP-7711. Fixed recursive sourcing of HADOOP_OPTS environment @@ -5328,24 +5325,24 @@ Release 0.23.0 - 2011-11-01 when running test-patch.sh. (Jonathan Eagles via tomwhite) HADOOP-7744. Ensure failed tests exit with proper error code. (Jonathan - Eagles via acmurthy) + Eagles via acmurthy) - HADOOP-7764. Allow HttpServer to set both ACL list and path spec filters. + HADOOP-7764. Allow HttpServer to set both ACL list and path spec filters. (Jonathan Eagles via acmurthy) - HADOOP-7766. The auth to local mappings are not being respected, with webhdfs + HADOOP-7766. The auth to local mappings are not being respected, with webhdfs and security enabled. (jitendra) - HADOOP-7721. Add log before login in KerberosAuthenticationHandler. + HADOOP-7721. 
Add log before login in KerberosAuthenticationHandler. (jitendra) HADOOP-7778. FindBugs warning in Token.getKind(). (tomwhite) HADOOP-7798. Add support gpg signatures for maven release artifacts. - (cutting via acmurthy) + (cutting via acmurthy) HADOOP-7797. Fix top-level pom.xml to refer to correct staging maven - repository. (omalley via acmurthy) + repository. (omalley via acmurthy) HADOOP-7101. UserGroupInformation.getCurrentUser() fails when called from non-Hadoop JAAS context. (todd) @@ -5376,8 +5373,8 @@ Release 0.22.0 - 2011-11-29 HADOOP-6791. Refresh for proxy superuser config (common part for HDFS-1096) (boryas) - HADOOP-6581. Add authenticated TokenIdentifiers to UGI so that - they can be used for authorization (Kan Zhang and Jitendra Pandey + HADOOP-6581. Add authenticated TokenIdentifiers to UGI so that + they can be used for authorization (Kan Zhang and Jitendra Pandey via jghoman) HADOOP-6584. Provide Kerberized SSL encryption for webservices. @@ -5385,7 +5382,7 @@ Release 0.22.0 - 2011-11-29 HADOOP-6853. Common component of HDFS-1045. (jghoman) - HADOOP-6859 - Introduce additional statistics to FileSystem to track + HADOOP-6859 - Introduce additional statistics to FileSystem to track file system operations (suresh) HADOOP-6870. Add a new API getFiles to FileSystem and FileContext that @@ -5397,7 +5394,7 @@ Release 0.22.0 - 2011-11-29 file systems associated with a particular UGI. (Devaraj Das and Kan Zhang via szetszwo) - HADOOP-6892. Common component of HDFS-1150 (Verify datanodes' identities + HADOOP-6892. Common component of HDFS-1150 (Verify datanodes' identities to clients in secure clusters) (jghoman) HADOOP-6889. Make RPC to have an option to timeout. (hairong) @@ -5405,10 +5402,10 @@ Release 0.22.0 - 2011-11-29 HADOOP-6996. Allow CodecFactory to return a codec object given a codec' class name. (hairong) - HADOOP-7013. Add boolean field isCorrupt to BlockLocation. + HADOOP-7013. Add boolean field isCorrupt to BlockLocation. 
(Patrick Kling via hairong) - HADOOP-6978. Adds support for NativeIO using JNI. + HADOOP-6978. Adds support for NativeIO using JNI. (Todd Lipcon, Devaraj Das & Owen O'Malley via ddas) HADOOP-7134. configure files that are generated as part of the released @@ -5416,19 +5413,19 @@ Release 0.22.0 - 2011-11-29 IMPROVEMENTS - HADOOP-6644. util.Shell getGROUPS_FOR_USER_COMMAND method name + HADOOP-6644. util.Shell getGROUPS_FOR_USER_COMMAND method name - should use common naming convention (boryas) - HADOOP-6778. add isRunning() method to + HADOOP-6778. add isRunning() method to AbstractDelegationTokenSecretManager (for HDFS-1044) (boryas) - HADOOP-6633. normalize property names for JT/NN kerberos principal + HADOOP-6633. normalize property names for JT/NN kerberos principal names in configuration (boryas) - HADOOP-6627. "Bad Connection to FS" message in FSShell should print + HADOOP-6627. "Bad Connection to FS" message in FSShell should print message from the exception (boryas) - HADOOP-6600. mechanism for authorization check for inter-server + HADOOP-6600. mechanism for authorization check for inter-server protocols. (boryas) HADOOP-6623. Add StringUtils.split for non-escaped single-character @@ -5440,13 +5437,13 @@ Release 0.22.0 - 2011-11-29 HADOOP-6714. Resolve compressed files using CodecFactory in FsShell::text. (Patrick Angeles via cdouglas) - HADOOP-6661. User document for UserGroupInformation.doAs. + HADOOP-6661. User document for UserGroupInformation.doAs. (Jitendra Pandey via jghoman) HADOOP-6674. Makes use of the SASL authentication options in the SASL RPC. (Jitendra Pandey via ddas) - HADOOP-6526. Need mapping from long principal names to local OS + HADOOP-6526. Need mapping from long principal names to local OS user names. (boryas) HADOOP-6814. Adds an API in UserGroupInformation to get the real @@ -5458,31 +5455,31 @@ Release 0.22.0 - 2011-11-29 HADOOP-6835. Add support for concatenated gzip input. (Greg Roelofs via cdouglas) - HADOOP-6845. 
Renames the TokenStorage class to Credentials. + HADOOP-6845. Renames the TokenStorage class to Credentials. (Jitendra Pandey via ddas) HADOOP-6826. FileStatus needs unit tests. (Rodrigo Schmidt via Eli Collins) - HADOOP-6905. add buildDTServiceName method to SecurityUtil + HADOOP-6905. add buildDTServiceName method to SecurityUtil (as part of MAPREDUCE-1718) (boryas) HADOOP-6632. Adds support for using different keytabs for different - servers in a Hadoop cluster. In the earier implementation, all servers + servers in a Hadoop cluster. In the earier implementation, all servers of a certain type (like TaskTracker), would have the same keytab and the same principal. Now the principal name is a pattern that has _HOST in it. (Kan Zhang & Jitendra Pandey via ddas) - HADOOP-6861. Adds new non-static methods in Credentials to read and + HADOOP-6861. Adds new non-static methods in Credentials to read and write token storage file. (Jitendra Pandey & Owen O'Malley via ddas) HADOOP-6877. Common part of HDFS-1178 (NameNode servlets should communicate with NameNode directrly). (Kan Zhang via jghoman) - - HADOOP-6475. Adding some javadoc to Server.RpcMetrics, UGI. + + HADOOP-6475. Adding some javadoc to Server.RpcMetrics, UGI. (Jitendra Pandey and borya via jghoman) - HADOOP-6656. Adds a thread in the UserGroupInformation to renew TGTs + HADOOP-6656. Adds a thread in the UserGroupInformation to renew TGTs periodically. (Owen O'Malley and ddas via ddas) HADOOP-6890. Improve listFiles API introduced by HADOOP-6870. (hairong) @@ -5492,7 +5489,7 @@ Release 0.22.0 - 2011-11-29 HADOOP-6911. doc update for DelegationTokenFetcher (boryas) - HADOOP-6900. Make the iterator returned by FileSystem#listLocatedStatus to + HADOOP-6900. Make the iterator returned by FileSystem#listLocatedStatus to throw IOException rather than RuntimeException when there is an IO error fetching the next file. (hairong) @@ -5504,13 +5501,13 @@ Release 0.22.0 - 2011-11-29 HADOOP-6803. 
Add native gzip read/write coverage to TestCodec. (Eli Collins via tomwhite) - HADOOP-6950. Suggest that HADOOP_CLASSPATH should be preserved in + HADOOP-6950. Suggest that HADOOP_CLASSPATH should be preserved in hadoop-env.sh.template. (Philip Zeyliger via Eli Collins) HADOOP-6922. Make AccessControlList a writable and update documentation for Job ACLs. (Ravi Gummadi via vinodkv) - HADOOP-6965. Introduces checks for whether the original tgt is valid + HADOOP-6965. Introduces checks for whether the original tgt is valid in the reloginFromKeytab method. HADOOP-6856. Simplify constructors for SequenceFile, and MapFile. (omalley) @@ -5531,7 +5528,7 @@ Release 0.22.0 - 2011-11-29 HADOOP-7009. MD5Hash provides a public factory method that creates an instance of thread local MessageDigest. (hairong) - HADOOP-7008. Enable test-patch.sh to have a configured number of + HADOOP-7008. Enable test-patch.sh to have a configured number of acceptable findbugs and javadoc warnings. (nigel and gkesavan) HADOOP-6818. Provides a JNI implementation of group resolution. (ddas) @@ -5550,19 +5547,19 @@ Release 0.22.0 - 2011-11-29 HADOOP-6903. Make AbstractFSileSystem methods and some FileContext methods to be public. (Sanjay Radia) - HADOOP-7034. Add TestPath tests to cover dot, dot dot, and slash + HADOOP-7034. Add TestPath tests to cover dot, dot dot, and slash normalization. (eli) HADOOP-7032. Assert type constraints in the FileStatus constructor. (eli) - HADOOP-6562. FileContextSymlinkBaseTest should use FileContextTestHelper. + HADOOP-6562. FileContextSymlinkBaseTest should use FileContextTestHelper. (eli) - HADOOP-7028. ant eclipse does not include requisite ant.jar in the + HADOOP-7028. ant eclipse does not include requisite ant.jar in the classpath. (Patrick Angeles via eli) HADOOP-6298. Add copyBytes to Text and BytesWritable. (omalley) - + HADOOP-6578. Configuration should trim whitespace around a lot of value types. 
(Michele Catasta via eli) @@ -5580,7 +5577,7 @@ Release 0.22.0 - 2011-11-29 HADOOP-7110. Implement chmod with JNI. (todd) HADOOP-6812. Change documentation for correct placement of configuration - variables: mapreduce.reduce.input.buffer.percent, + variables: mapreduce.reduce.input.buffer.percent, mapreduce.task.io.sort.factor, mapreduce.task.io.sort.mb (Chris Douglas via shv) @@ -5593,7 +5590,7 @@ Release 0.22.0 - 2011-11-29 HADOOP-7187. Fix socket leak in GangliaContext. (Uma Maheswara Rao G via szetszwo) - HADOOP-7241. fix typo of command 'hadoop fs -help tail'. + HADOOP-7241. fix typo of command 'hadoop fs -help tail'. (Wei Yongjun via eli) HADOOP-7244. Documentation change for updated configuration keys. @@ -5637,17 +5634,17 @@ Release 0.22.0 - 2011-11-29 BUG FIXES - HADOOP-6638. try to relogin in a case of failed RPC connection (expired + HADOOP-6638. try to relogin in a case of failed RPC connection (expired tgt) only in case the subject is loginUser or proxyUgi.realUser. (boryas) HADOOP-6781. security audit log shouldn't have exception in it. (boryas) - HADOOP-6612. Protocols RefreshUserToGroupMappingsProtocol and + HADOOP-6612. Protocols RefreshUserToGroupMappingsProtocol and RefreshAuthorizationPolicyProtocol will fail with security enabled (boryas) HADOOP-6764. Remove verbose logging from the Groups class. (Boris Shkolnik) - HADOOP-6730. Bug in FileContext#copy and provide base class for + HADOOP-6730. Bug in FileContext#copy and provide base class for FileContext tests. (Ravi Phulari via jghoman) HADOOP-6669. Respect compression configuration when creating DefaultCodec @@ -5660,13 +5657,13 @@ Release 0.22.0 - 2011-11-29 glob pattern code less restrictive and more POSIX standard compliant. (Luke Lu via eli) - HADOOP-6649. login object in UGI should be inside the subject (jnp via + HADOOP-6649. login object in UGI should be inside the subject (jnp via boryas) - HADOOP-6687. user object in the subject in UGI should be reused in case + HADOOP-6687. 
user object in the subject in UGI should be reused in case of a relogin. (jnp via boryas) - HADOOP-6603. Provide workaround for issue with Kerberos not resolving + HADOOP-6603. Provide workaround for issue with Kerberos not resolving cross-realm principal (Kan Zhang and Jitendra Pandey via jghoman) HADOOP-6620. NPE if renewer is passed as null in getDelegationToken. @@ -5678,16 +5675,16 @@ Release 0.22.0 - 2011-11-29 HADOOP-6682. NetUtils:normalizeHostName does not process hostnames starting with [a-f] correctly. (jghoman) - HADOOP-6652. Removes the unnecessary cache from + HADOOP-6652. Removes the unnecessary cache from ShellBasedUnixGroupsMapping. (ddas) - HADOOP-6815. refreshSuperUserGroupsConfiguration should use server side + HADOOP-6815. refreshSuperUserGroupsConfiguration should use server side configuration for the refresh (boryas) HADOOP-6648. Adds a check for null tokens in Credentials.addToken api. (ddas) - - HADOOP-6647. balancer fails with "is not authorized for protocol + + HADOOP-6647. balancer fails with "is not authorized for protocol interface NamenodeProtocol" in secure environment (boryas) HADOOP-6834. TFile.append compares initial key against null lastKey @@ -5699,7 +5696,7 @@ Release 0.22.0 - 2011-11-29 HADOOP-6536. Fixes FileUtil.fullyDelete() not to delete the contents of the sym-linked directory. (Ravi Gummadi via amareshwari) - HADOOP-6873. using delegation token over hftp for long + HADOOP-6873. using delegation token over hftp for long running clients (boryas) HADOOP-6706. Improves the sasl failure handling due to expired tickets, @@ -5708,22 +5705,22 @@ Release 0.22.0 - 2011-11-29 HADOOP-6715. Fixes AccessControlList.toString() to return a descriptive String representation of the ACL. (Ravi Gummadi via amareshwari) - HADOOP-6885. Fix java doc warnings in Groups and - RefreshUserMappingsProtocol. (Eli Collins via jghoman) + HADOOP-6885. Fix java doc warnings in Groups and + RefreshUserMappingsProtocol. 
(Eli Collins via jghoman) - HADOOP-6482. GenericOptionsParser constructor that takes Options and + HADOOP-6482. GenericOptionsParser constructor that takes Options and String[] ignores options. (Eli Collins via jghoman) HADOOP-6906. FileContext copy() utility doesn't work with recursive copying of directories. (vinod k v via mahadev) - HADOOP-6453. Hadoop wrapper script shouldn't ignore an existing + HADOOP-6453. Hadoop wrapper script shouldn't ignore an existing JAVA_LIBRARY_PATH. (Chad Metcalf via jghoman) - HADOOP-6932. Namenode start (init) fails because of invalid kerberos + HADOOP-6932. Namenode start (init) fails because of invalid kerberos key, even when security set to "simple" (boryas) - HADOOP-6913. Circular initialization between UserGroupInformation and + HADOOP-6913. Circular initialization between UserGroupInformation and KerberosName (Kan Zhang via boryas) HADOOP-6907. Rpc client doesn't use the per-connection conf to figure @@ -5732,10 +5729,10 @@ Release 0.22.0 - 2011-11-29 HADOOP-6938. ConnectionId.getRemotePrincipal() should check if security is enabled. (Kan Zhang via hairong) - HADOOP-6930. AvroRpcEngine doesn't work with generated Avro code. + HADOOP-6930. AvroRpcEngine doesn't work with generated Avro code. (sharad) - HADOOP-6940. RawLocalFileSystem's markSupported method misnamed + HADOOP-6940. RawLocalFileSystem's markSupported method misnamed markSupport. (Tom White via eli). HADOOP-6951. Distinct minicluster services (e.g. NN and JT) overwrite each @@ -5818,7 +5815,7 @@ Release 0.22.0 - 2011-11-29 HADOOP-7126. Fix file permission setting for RawLocalFileSystem on Windows. (Po Cheung via shv) - HADOOP-6642. Fix javac, javadoc, findbugs warnings related to security work. + HADOOP-6642. Fix javac, javadoc, findbugs warnings related to security work. (Chris Douglas, Po Cheung via shv) HADOOP-7140. IPC Reader threads do not stop when server stops (todd) @@ -5905,7 +5902,7 @@ Release 0.21.1 - Unreleased BUG FIXES - HADOOP-6925. 
BZip2Codec incorrectly implements read(). + HADOOP-6925. BZip2Codec incorrectly implements read(). (Todd Lipcon via Eli Collins) HADOOP-6833. IPC leaks call parameters when exceptions thrown. @@ -5924,7 +5921,7 @@ Release 0.21.1 - Unreleased HADOOP-7052. misspelling of threshold in conf/log4j.properties. (Jingguo Yao via eli) - HADOOP-7053. wrong FSNamesystem Audit logging setting in + HADOOP-7053. wrong FSNamesystem Audit logging setting in conf/log4j.properties. (Jingguo Yao via eli) HADOOP-7120. Fix a syntax error in test-patch.sh. (szetszwo) @@ -5979,13 +5976,13 @@ Release 0.21.0 - 2010-08-13 HADOOP-2827. Remove deprecated NetUtils::getServerAddress. (cdouglas) - HADOOP-5681. Change examples RandomWriter and RandomTextWriter to + HADOOP-5681. Change examples RandomWriter and RandomTextWriter to use new mapreduce API. (Amareshwari Sriramadasu via sharad) - HADOOP-5680. Change org.apache.hadoop.examples.SleepJob to use new + HADOOP-5680. Change org.apache.hadoop.examples.SleepJob to use new mapreduce api. (Amareshwari Sriramadasu via sharad) - HADOOP-5699. Change org.apache.hadoop.examples.PiEstimator to use + HADOOP-5699. Change org.apache.hadoop.examples.PiEstimator to use new mapreduce api. (Amareshwari Sriramadasu via sharad) HADOOP-5720. Introduces new task types - JOB_SETUP, JOB_CLEANUP @@ -5998,22 +5995,22 @@ Release 0.21.0 - 2010-08-13 HADOOP-5738. Split "waiting_tasks" JobTracker metric into waiting maps and waiting reduces. (Sreekanth Ramakrishnan via cdouglas) - HADOOP-5679. Resolve findbugs warnings in core/streaming/pipes/examples. + HADOOP-5679. Resolve findbugs warnings in core/streaming/pipes/examples. (Jothi Padmanabhan via sharad) HADOOP-4359. Support for data access authorization checking on Datanodes. (Kan Zhang via rangadi) - HADOOP-5690. Change org.apache.hadoop.examples.DBCountPageView to use + HADOOP-5690. Change org.apache.hadoop.examples.DBCountPageView to use new mapreduce api. (Amareshwari Sriramadasu via sharad) - HADOOP-5694. 
Change org.apache.hadoop.examples.dancing to use new + HADOOP-5694. Change org.apache.hadoop.examples.dancing to use new mapreduce api. (Amareshwari Sriramadasu via sharad) - HADOOP-5696. Change org.apache.hadoop.examples.Sort to use new + HADOOP-5696. Change org.apache.hadoop.examples.Sort to use new mapreduce api. (Amareshwari Sriramadasu via sharad) - HADOOP-5698. Change org.apache.hadoop.examples.MultiFileWordCount to + HADOOP-5698. Change org.apache.hadoop.examples.MultiFileWordCount to use new mapreduce api. (Amareshwari Sriramadasu via sharad) HADOOP-5913. Provide ability to an administrator to stop and start @@ -6079,7 +6076,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5258. Add a new DFSAdmin command to print a tree of the rack and datanode topology as seen by the namenode. (Jakob Homan via szetszwo) - + HADOOP-4756. A command line tool to access JMX properties on NameNode and DataNode. (Boris Shkolnik via rangadi) @@ -6108,7 +6105,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5752. Add a new hdfs image processor, Delimited, to oiv. (Jakob Homan via szetszwo) - HADOOP-5266. Adds the capability to do mark/reset of the reduce values + HADOOP-5266. Adds the capability to do mark/reset of the reduce values iterator in the Context object API. (Jothi Padmanabhan via ddas) HADOOP-5745. Allow setting the default value of maxRunningJobs for all @@ -6136,12 +6133,12 @@ Release 0.21.0 - 2010-08-13 (sharad via cutting) HADOOP-6226. Moves BoundedByteArrayOutputStream from the tfile package to - the io package and makes it available to other users (MAPREDUCE-318). + the io package and makes it available to other users (MAPREDUCE-318). (Jothi Padmanabhan via ddas) HADOOP-6105. Adds support for automatically handling deprecation of configuration keys. (V.V.Chaitanya Krishna via yhemanth) - + HADOOP-6235. Adds new method to FileSystem for clients to get server defaults. (Kan Zhang via suresh) @@ -6154,7 +6151,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-4012. 
Provide splitting support for bzip2 compressed files. (Abdul Qadeer via cdouglas) - HADOOP-6246. Add backward compatibility support to use deprecated decimal + HADOOP-6246. Add backward compatibility support to use deprecated decimal umask from old configuration. (Jakob Homan via suresh) HADOOP-4952. Add new improved file system interface FileContext for the @@ -6192,7 +6189,7 @@ Release 0.21.0 - 2010-08-13 threads. This can be used to delete files in the Distributed Cache. (Zheng Shao via dhruba) - HADOOP-6415. Adds a common token interface for both job token and + HADOOP-6415. Adds a common token interface for both job token and delegation token. (Kan Zhang via ddas) HADOOP-6408. Add a /conf servlet to dump running configuration. @@ -6214,17 +6211,17 @@ Release 0.21.0 - 2010-08-13 (RawLocalFs) that allows local symlinks. (Eli Collins via Sanjay Radia) HADOOP-6577. Add hidden configuration option "ipc.server.max.response.size" - to change the default 1 MB, the maximum size when large IPC handler + to change the default 1 MB, the maximum size when large IPC handler response buffer is reset. (suresh) - HADOOP-6568. Adds authorization for the default servlets. + HADOOP-6568. Adds authorization for the default servlets. (Vinod Kumar Vavilapalli via ddas) HADOOP-6586. Log authentication and authorization failures and successes for RPC (boryas) HADOOP-6580. UGI should contain authentication method. (jnp via boryas) - + HADOOP-6657. Add a capitalization method to StringUtils for MAPREDUCE-1545. (Luke Lu via Steve Loughran) @@ -6260,7 +6257,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5017. Change NameNode.namesystem declaration to private. (szetszwo) HADOOP-4794. Add branch information from the source version control into - the version information that is compiled into Hadoop. (cdouglas via + the version information that is compiled into Hadoop. (cdouglas via omalley) HADOOP-5070. 
Increment copyright year to 2009, remove assertions of ASF @@ -6271,8 +6268,8 @@ Release 0.21.0 - 2010-08-13 HADOOP-5088. Include releaseaudit target as part of developer test-patch target. (Giridharan Kesavan via nigel) - HADOOP-2721. Uses setsid when creating new tasks so that subprocesses of - this process will be within this new session (and this process will be + HADOOP-2721. Uses setsid when creating new tasks so that subprocesses of + this process will be within this new session (and this process will be the process leader for all the subprocesses). Killing the process leader, or the main Java task in Hadoop's case, kills the entire subtree of processes. (Ravi Gummadi via ddas) @@ -6286,7 +6283,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5124. Choose datanodes randomly instead of starting from the first datanode for providing fairness. (hairong via szetszwo) - HADOOP-4930. Implement a Linux native executable that can be used to + HADOOP-4930. Implement a Linux native executable that can be used to launch tasks as users. (Sreekanth Ramakrishnan via yhemanth) HADOOP-5122. Fix format of fs.default.name value in libhdfs test conf. @@ -6299,7 +6296,7 @@ Release 0.21.0 - 2010-08-13 tools, and example jars. Let findbugs depend on this rather than the 'tar' target. (Giridharan Kesavan via cdouglas) - HADOOP-4868. Splits the hadoop script into three parts - bin/hadoop, + HADOOP-4868. Splits the hadoop script into three parts - bin/hadoop, bin/mapred and bin/hdfs. (Sharad Agarwal via ddas) HADOOP-1722. Adds support for TypedBytes and RawBytes in Streaming. @@ -6308,7 +6305,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-4220. Changes the JobTracker restart tests so that they take much less time. (Amar Kamat via ddas) - HADOOP-4885. Try to restore failed name-node storage directories at + HADOOP-4885. Try to restore failed name-node storage directories at checkpoint time. (Boris Shkolnik via shv) HADOOP-5209. Update year to 2009 for javadoc. 
(szetszwo) @@ -6316,7 +6313,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5279. Remove unnecessary targets from test-patch.sh. (Giridharan Kesavan via nigel) - HADOOP-5120. Remove the use of FSNamesystem.getFSNamesystem() from + HADOOP-5120. Remove the use of FSNamesystem.getFSNamesystem() from UpgradeManagerNamenode and UpgradeObjectNamenode. (szetszwo) HADOOP-5222. Add offset to datanode clienttrace. (Lei Xu via cdouglas) @@ -6336,8 +6333,8 @@ Release 0.21.0 - 2010-08-13 HADOOP-4546. Fix DF reporting for AIX. (Bill Habermaas via cdouglas) HADOOP-5023. Add Tomcat support to HdfsProxy. (Zhiyong Zhang via cdouglas) - - HADOOP-5317. Provide documentation for LazyOutput Feature. + + HADOOP-5317. Provide documentation for LazyOutput Feature. (Jothi Padmanabhan via johan) HADOOP-5455. Document rpc metrics context to the extent dfs, mapred, and @@ -6347,12 +6344,12 @@ Release 0.21.0 - 2010-08-13 generator. (Jakob Homan via hairong) HADOOP-5442. Paginate jobhistory display and added some search - capabilities. (Amar Kamat via acmurthy) + capabilities. (Amar Kamat via acmurthy) HADOOP-4842. Streaming now allows specifiying a command for the combiner. (Amareshwari Sriramadasu via ddas) - HADOOP-5196. avoiding unnecessary byte[] allocation in + HADOOP-5196. avoiding unnecessary byte[] allocation in SequenceFile.CompressedBytes and SequenceFile.UncompressedBytes. (hong tang via mahadev) @@ -6384,7 +6381,7 @@ Release 0.21.0 - 2010-08-13 (Jakob Homan via shv) HADOOP-5485. Mask actions in the fair scheduler's servlet UI based on - value of webinterface.private.actions. + value of webinterface.private.actions. (Vinod Kumar Vavilapalli via yhemanth) HADOOP-5581. HDFS should throw FileNotFoundException when while opening @@ -6404,7 +6401,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-4490. Provide ability to run tasks as job owners. (Sreekanth Ramakrishnan via yhemanth) - HADOOP-5697. Change org.apache.hadoop.examples.Grep to use new + HADOOP-5697. 
Change org.apache.hadoop.examples.Grep to use new mapreduce api. (Amareshwari Sriramadasu via sharad) HADOOP-5625. Add operation duration to clienttrace. (Lei Xu via cdouglas) @@ -6424,7 +6421,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5613. Change S3Exception to checked exception. (Andrew Hitchcock via tomwhite) - HADOOP-5717. Create public enum class for the Framework counters in + HADOOP-5717. Create public enum class for the Framework counters in org.apache.hadoop.mapreduce. (Amareshwari Sriramadasu via sharad) HADOOP-5217. Split AllTestDriver for core, hdfs and mapred. (sharad) @@ -6451,8 +6448,8 @@ Release 0.21.0 - 2010-08-13 HADOOP-5080. Add new test cases to TestMRCLI and TestHDFSCLI (V.Karthikeyan via nigel) - HADOOP-5135. Splits the tests into different directories based on the - package. Four new test targets have been defined - run-test-core, + HADOOP-5135. Splits the tests into different directories based on the + package. Four new test targets have been defined - run-test-core, run-test-mapred, run-test-hdfs and run-test-hdfs-with-mr. (Sharad Agarwal via ddas) @@ -6467,7 +6464,7 @@ Release 0.21.0 - 2010-08-13 (Raghu Angadi) HADOOP-5823. Added a new class DeprecatedUTF8 to help with removing - UTF8 related javac warnings. These warnings are removed in + UTF8 related javac warnings. These warnings are removed in FSEditLog.java as a use case. (Raghu Angadi) HADOOP-5824. Deprecate DataTransferProtocol.OP_READ_METADATA and remove @@ -6481,7 +6478,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5854. Fix a few "Inconsistent Synchronization" warnings in HDFS. (Raghu Angadi) - HADOOP-5369. Small tweaks to reduce MapFile index size. (Ben Maurer + HADOOP-5369. Small tweaks to reduce MapFile index size. (Ben Maurer via sharad) HADOOP-5858. Eliminate UTF8 and fix warnings in test/hdfs-with-mr package. @@ -6502,11 +6499,11 @@ Release 0.21.0 - 2010-08-13 HADOOP-5839. Fix EC2 scripts to allow remote job submission. (Joydeep Sen Sarma via tomwhite) - HADOOP-5877. 
Fix javac warnings in TestHDFSServerPorts, TestCheckpoint, + HADOOP-5877. Fix javac warnings in TestHDFSServerPorts, TestCheckpoint, TestNameEditsConfig, TestStartup and TestStorageRestore. (Jakob Homan via shv) - HADOOP-5438. Provide a single FileSystem method to create or + HADOOP-5438. Provide a single FileSystem method to create or open-for-append to a file. (He Yongqiang via dhruba) HADOOP-5472. Change DistCp to support globbing of input paths. (Dhruba @@ -6520,8 +6517,8 @@ Release 0.21.0 - 2010-08-13 HADOOP-5664. Change map serialization so a lock is obtained only where contention is possible, rather than for each write. (cdouglas) - HADOOP-5896. Remove the dependency of GenericOptionsParser on - Option.withArgPattern. (Giridharan Kesavan and Sharad Agarwal via + HADOOP-5896. Remove the dependency of GenericOptionsParser on + Option.withArgPattern. (Giridharan Kesavan and Sharad Agarwal via sharad) HADOOP-5784. Makes the number of heartbeats that should arrive a second @@ -6530,10 +6527,10 @@ Release 0.21.0 - 2010-08-13 HADOOP-5955. Changes TestFileOuputFormat so that is uses LOCAL_MR instead of CLUSTER_MR. (Jothi Padmanabhan via das) - HADOOP-5948. Changes TestJavaSerialization to use LocalJobRunner + HADOOP-5948. Changes TestJavaSerialization to use LocalJobRunner instead of MiniMR/DFS cluster. (Jothi Padmanabhan via das) - HADOOP-2838. Add mapred.child.env to pass environment variables to + HADOOP-2838. Add mapred.child.env to pass environment variables to tasktracker's child processes. (Amar Kamat via sharad) HADOOP-5961. DataNode process understand generic hadoop command line @@ -6545,13 +6542,13 @@ Release 0.21.0 - 2010-08-13 HADOOP-2141. Improves the speculative execution heuristic. The heuristic is currently based on the progress-rates of tasks and the expected time to complete. Also, statistics about trackers are collected, and speculative - tasks are not given to the ones deduced to be slow. + tasks are not given to the ones deduced to be slow. 
(Andy Konwinski and ddas) HADOOP-5952. Change "-1 tests included" wording in test-patch.sh. (Gary Murry via szetszwo) - HADOOP-6106. Provides an option in ShellCommandExecutor to timeout + HADOOP-6106. Provides an option in ShellCommandExecutor to timeout commands that do not complete within a certain amount of time. (Sreekanth Ramakrishnan via yhemanth) @@ -6579,8 +6576,8 @@ Release 0.21.0 - 2010-08-13 HADOOP-6160. Fix releaseaudit target to run on specific directories. (gkesavan) - - HADOOP-6169. Removing deprecated method calls in TFile. (hong tang via + + HADOOP-6169. Removing deprecated method calls in TFile. (hong tang via mahadev) HADOOP-6176. Add a couple package private methods to AccessTokenHandler @@ -6611,7 +6608,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6216. Support comments in host files. (Ravi Phulari and Dmytro Molkov via szetszwo) - HADOOP-6217. Update documentation for project split. (Corinne Chandel via + HADOOP-6217. Update documentation for project split. (Corinne Chandel via omalley) HADOOP-6268. Add ivy jar to .gitignore. (Todd Lipcon via cdouglas) @@ -6683,7 +6680,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6435. Make RPC.waitForProxy with timeout public. (Steve Loughran via tomwhite) - + HADOOP-6472. add tokenCache option to GenericOptionsParser for passing file with secret keys to a map reduce job. (boryas) @@ -6705,7 +6702,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6495. Identifier should be serialized after the password is created In Token constructor (jnp via boryas) - HADOOP-6518. Makes the UGI honor the env var KRB5CCNAME. + HADOOP-6518. Makes the UGI honor the env var KRB5CCNAME. (Owen O'Malley via ddas) HADOOP-6531. Enhance FileUtil with an API to delete all contents of a @@ -6720,17 +6717,17 @@ Release 0.21.0 - 2010-08-13 HADOOP-6534. Trim whitespace from directory lists initializing LocalDirAllocator. (Todd Lipcon via cdouglas) - HADOOP-6559. Makes the RPC client automatically re-login when the SASL + HADOOP-6559. 
Makes the RPC client automatically re-login when the SASL connection setup fails. This is applicable only to keytab based logins. (Devaraj Das) HADOOP-6551. Delegation token renewing and cancelling should provide - meaningful exceptions when there are failures instead of returning + meaningful exceptions when there are failures instead of returning false. (omalley) HADOOP-6583. Captures authentication and authorization metrics. (ddas) - HADOOP-6543. Allows secure clients to talk to unsecure clusters. + HADOOP-6543. Allows secure clients to talk to unsecure clusters. (Kan Zhang via ddas) HADOOP-6579. Provide a mechanism for encoding/decoding Tokens from @@ -6742,7 +6739,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6573. Support for persistent delegation tokens. (Jitendra Pandey via shv) - HADOOP-6594. Provide a fetchdt tool via bin/hdfs. (jhoman via acmurthy) + HADOOP-6594. Provide a fetchdt tool via bin/hdfs. (jhoman via acmurthy) HADOOP-6589. Provide better error messages when RPC authentication fails. (Kan Zhang via omalley) @@ -6750,7 +6747,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6599 Split existing RpcMetrics into RpcMetrics & RpcDetailedMetrics. (Suresh Srinivas via Sanjay Radia) - HADOOP-6537 Declare more detailed exceptions in FileContext and + HADOOP-6537 Declare more detailed exceptions in FileContext and AbstractFileSystem (Suresh Srinivas via Sanjay Radia) HADOOP-6486. fix common classes to work with Avro 1.3 reflection. @@ -6778,10 +6775,10 @@ Release 0.21.0 - 2010-08-13 HADOOP-6658. Exclude Private elements from generated Javadoc. (tomwhite) - HADOOP-6635. Install/deploy source jars to Maven repo. + HADOOP-6635. Install/deploy source jars to Maven repo. (Patrick Angeles via jghoman) - HADOOP-6717. Log levels in o.a.h.security.Groups too high + HADOOP-6717. Log levels in o.a.h.security.Groups too high (Todd Lipcon via jghoman) HADOOP-6667. RPC.waitForProxy should retry through NoRouteToHostException. 
@@ -6809,10 +6806,10 @@ Release 0.21.0 - 2010-08-13 HADOOP-6403. Deprecate EC2 bash scripts. (tomwhite) - HADOOP-6769. Add an API in FileSystem to get FileSystem instances based + HADOOP-6769. Add an API in FileSystem to get FileSystem instances based on users(ddas via boryas) - HADOOP-6813. Add a new newInstance method in FileSystem that takes + HADOOP-6813. Add a new newInstance method in FileSystem that takes a "user" as argument (ddas via boryas) HADOOP-6668. Apply audience and stability annotations to classes in @@ -6836,10 +6833,10 @@ Release 0.21.0 - 2010-08-13 HADOOP-6166. Further improve the performance of the pure-Java CRC32 implementation. (Tsz Wo (Nicholas), SZE via cdouglas) - HADOOP-6271. Add recursive and non recursive create and mkdir to + HADOOP-6271. Add recursive and non recursive create and mkdir to FileContext. (Sanjay Radia via suresh) - HADOOP-6261. Add URI based tests for FileContext. + HADOOP-6261. Add URI based tests for FileContext. (Ravi Pulari via suresh). HADOOP-6307. Add a new SequenceFile.Reader constructor in order to support @@ -6860,7 +6857,7 @@ Release 0.21.0 - 2010-08-13 BUG FIXES HADOOP-6748. Removes hadoop.cluster.administrators, cluster administrators - acl is passed as parameter in constructor. (amareshwari) + acl is passed as parameter in constructor. (amareshwari) HADOOP-6828. Herrior uses old way of accessing logs directories (Sreekanth Ramakrishnan via cos) @@ -6879,10 +6876,10 @@ Release 0.21.0 - 2010-08-13 HADOOP-4963. Fixes a logging to do with getting the location of map output file. (Amareshwari Sriramadasu via ddas) - HADOOP-2337. Trash should close FileSystem on exit and should not start + HADOOP-2337. Trash should close FileSystem on exit and should not start emtying thread if disabled. (shv) - HADOOP-5072. Fix failure in TestCodec because testSequenceFileGzipCodec + HADOOP-5072. Fix failure in TestCodec because testSequenceFileGzipCodec won't pass without native gzip codec. (Zheng Shao via dhruba) HADOOP-5050. 
TestDFSShell.testFilePermissions should not assume umask @@ -6924,11 +6921,11 @@ Release 0.21.0 - 2010-08-13 HADOOP-5100. Append, rather than truncate, when creating log4j metrics in Chukwa. (Jerome Boulon via cdouglas) - HADOOP-5204. Fix broken trunk compilation on Hudson by letting + HADOOP-5204. Fix broken trunk compilation on Hudson by letting task-controller be an independent target in build.xml. (Sreekanth Ramakrishnan via yhemanth) - HADOOP-5212. Fix the path translation problem introduced by HADOOP-4868 + HADOOP-5212. Fix the path translation problem introduced by HADOOP-4868 running on cygwin. (Sharad Agarwal via omalley) HADOOP-5226. Add license headers to html and jsp files. (szetszwo) @@ -6937,10 +6934,10 @@ Release 0.21.0 - 2010-08-13 (Jerome Boulon via nigel) HADOOP-4933. Fixes a ConcurrentModificationException problem that shows up - when the history viewer is accessed concurrently. + when the history viewer is accessed concurrently. (Amar Kamat via ddas) - HADOOP-5253. Remove duplicate call to cn-docs target. + HADOOP-5253. Remove duplicate call to cn-docs target. (Giri Kesavan via nigel) HADOOP-5251. Fix classpath for contrib unit tests to include clover jar. @@ -6958,16 +6955,16 @@ Release 0.21.0 - 2010-08-13 HADOOP-5300. Fix ant javadoc-dev target and the typo in the class name NameNodeActivtyMBean. (szetszwo) - HADOOP-5218. libhdfs unit test failed because it was unable to + HADOOP-5218. libhdfs unit test failed because it was unable to start namenode/datanode. Fixed. (dhruba) HADOOP-5273. Add license header to TestJobInProgress.java. (Jakob Homan via szetszwo) - + HADOOP-5229. Remove duplicate version variables in build files (Stefan Groschupf via johan) - HADOOP-5383. Avoid building an unused string in NameNode's + HADOOP-5383. Avoid building an unused string in NameNode's verifyReplication(). (Raghu Angadi) HADOOP-5347. Create a job output directory for the bbp examples. 
(szetszwo) @@ -6987,7 +6984,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5507. Fix JMXGet javadoc warnings. (Boris Shkolnik via szetszwo) - HADOOP-5191. Accessing HDFS with any ip or hostname should work as long + HADOOP-5191. Accessing HDFS with any ip or hostname should work as long as it points to the interface NameNode is listening on. (Raghu Angadi) HADOOP-5561. Add javadoc.maxmemory parameter to build, preventing OOM @@ -6999,13 +6996,13 @@ Release 0.21.0 - 2010-08-13 HADOOP-5477. Fix rare failure in TestCLI for hosts returning variations of 'localhost'. (Jakob Homan via cdouglas) - HADOOP-5194. Disables setsid for tasks run on cygwin. + HADOOP-5194. Disables setsid for tasks run on cygwin. (Ravi Gummadi via ddas) HADOOP-5322. Fix misleading/outdated comments in JobInProgress. (Amareshwari Sriramadasu via cdouglas) - HADOOP-5198. Fixes a problem to do with the task PID file being absent and + HADOOP-5198. Fixes a problem to do with the task PID file being absent and the JvmManager trying to look for it. (Amareshwari Sriramadasu via ddas) HADOOP-5464. DFSClient did not treat write timeout of 0 properly. @@ -7020,10 +7017,10 @@ Release 0.21.0 - 2010-08-13 HADOOP-5652. Fix a bug where in-memory segments are incorrectly retained in memory. (cdouglas) - HADOOP-5533. Recovery duration shown on the jobtracker webpage is + HADOOP-5533. Recovery duration shown on the jobtracker webpage is inaccurate. (Amar Kamat via sharad) - HADOOP-5647. Fix TestJobHistory to not depend on /tmp. (Ravi Gummadi + HADOOP-5647. Fix TestJobHistory to not depend on /tmp. (Ravi Gummadi via sharad) HADOOP-5661. Fixes some findbugs warnings in o.a.h.mapred* packages and @@ -7068,10 +7065,10 @@ Release 0.21.0 - 2010-08-13 HADOOP-5737. Fixes a problem in the way the JobTracker used to talk to other daemons like the NameNode to get the job's files. Also adds APIs in the JobTracker to get the FileSystem objects as per the JobTracker's - configuration. (Amar Kamat via ddas) + configuration. 
(Amar Kamat via ddas) - HADOOP-5648. Not able to generate gridmix.jar on the already compiled - version of hadoop. (gkesavan) + HADOOP-5648. Not able to generate gridmix.jar on the already compiled + version of hadoop. (gkesavan) HADOOP-5808. Fix import never used javac warnings in hdfs. (szetszwo) @@ -7092,7 +7089,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5845. Build successful despite test failure on test-core target. (sharad) - HADOOP-5314. Prevent unnecessary saving of the file system image during + HADOOP-5314. Prevent unnecessary saving of the file system image during name-node startup. (Jakob Homan via shv) HADOOP-5855. Fix javac warnings for DisallowedDatanodeException and @@ -7112,7 +7109,7 @@ Release 0.21.0 - 2010-08-13 Srinivas via szetszwo) HADOOP-5801. Fixes the problem: If the hosts file is changed across restart - then it should be refreshed upon recovery so that the excluded hosts are + then it should be refreshed upon recovery so that the excluded hosts are lost and the maps are re-executed. (Amar Kamat via ddas) HADOOP-5841. Resolve findbugs warnings in DistributedFileSystem, @@ -7129,16 +7126,16 @@ Release 0.21.0 - 2010-08-13 HADOOP-5867. Fix javac warnings found in NNBench and NNBenchWithoutMR. (Konstantin Boudnik via szetszwo) - + HADOOP-5728. Fixed FSEditLog.printStatistics IndexOutOfBoundsException. (Wang Xu via johan) - HADOOP-5847. Fixed failing Streaming unit tests (gkesavan) + HADOOP-5847. Fixed failing Streaming unit tests (gkesavan) - HADOOP-5252. Streaming overrides -inputformat option (Klaas Bosteels + HADOOP-5252. Streaming overrides -inputformat option (Klaas Bosteels via sharad) - HADOOP-5710. Counter MAP_INPUT_BYTES missing from new mapreduce api. + HADOOP-5710. Counter MAP_INPUT_BYTES missing from new mapreduce api. (Amareshwari Sriramadasu via sharad) HADOOP-5809. Fix job submission, broken by errant directory creation. @@ -7151,7 +7148,7 @@ Release 0.21.0 - 2010-08-13 in DataBlockScanner. (Kan Zhang via szetszwo) HADOOP-4864. 
Fixes a problem to do with -libjars with multiple jars when - client and cluster reside on different OSs. (Amareshwari Sriramadasu via + client and cluster reside on different OSs. (Amareshwari Sriramadasu via ddas) HADOOP-5623. Fixes a problem to do with status messages getting overwritten @@ -7160,16 +7157,16 @@ Release 0.21.0 - 2010-08-13 HADOOP-5895. Fixes computation of count of merged bytes for logging. (Ravi Gummadi via ddas) - HADOOP-5805. problem using top level s3 buckets as input/output + HADOOP-5805. problem using top level s3 buckets as input/output directories. (Ian Nowland via tomwhite) - - HADOOP-5940. trunk eclipse-plugin build fails while trying to copy + + HADOOP-5940. trunk eclipse-plugin build fails while trying to copy commons-cli jar from the lib dir (Giridharan Kesavan via gkesavan) HADOOP-5864. Fix DMI and OBL findbugs in packages hdfs and metrics. (hairong) - HADOOP-5935. Fix Hudson's release audit warnings link is broken. + HADOOP-5935. Fix Hudson's release audit warnings link is broken. (Giridharan Kesavan via gkesavan) HADOOP-5947. Delete empty TestCombineFileInputFormat.java @@ -7180,7 +7177,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5944. Add Apache license header to BlockManager.java. (Suresh Srinivas via szetszwo) - HADOOP-5891. SecondaryNamenode is able to converse with the NameNode + HADOOP-5891. SecondaryNamenode is able to converse with the NameNode even when the default value of dfs.http.address is not overridden. (Todd Lipcon via dhruba) @@ -7204,7 +7201,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-5859. Fix "wait() or sleep() with locks held" findbugs warnings in DFSClient. (Kan Zhang via szetszwo) - + HADOOP-5457. Fix to continue to run builds even if contrib test fails (Giridharan Kesavan via gkesavan) @@ -7223,7 +7220,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6031. Remove @author tags from Java source files. (Ravi Phulari via szetszwo) - HADOOP-5980. Fix LinuxTaskController so tasks get passed + HADOOP-5980. 
Fix LinuxTaskController so tasks get passed LD_LIBRARY_PATH and other environment variables. (Sreekanth Ramakrishnan via yhemanth) @@ -7245,7 +7242,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6114. Fix javadoc documentation for FileStatus.getLen. (Dmitry Rzhevskiy via dhruba) - HADOOP-6131. A sysproperty should not be set unless the property + HADOOP-6131. A sysproperty should not be set unless the property is set on the ant command line in build.xml (hong tang via mahadev) HADOOP-6137. Fix project specific test-patch requirements @@ -7260,21 +7257,21 @@ Release 0.21.0 - 2010-08-13 HADOOP-6123. Add missing classpaths in hadoop-config.sh. (Sharad Agarwal via szetszwo) - HADOOP-6172. Fix jar file names in hadoop-config.sh and include - ${build.src} as a part of the source list in build.xml. (Hong Tang via + HADOOP-6172. Fix jar file names in hadoop-config.sh and include + ${build.src} as a part of the source list in build.xml. (Hong Tang via szetszwo) HADOOP-6124. Fix javac warning detection in test-patch.sh. (Giridharan Kesavan via szetszwo) - HADOOP-6177. FSInputChecker.getPos() would return position greater + HADOOP-6177. FSInputChecker.getPos() would return position greater than the file size. (Hong Tang via hairong) HADOOP-6188. TestTrash uses java.io.File api but not hadoop FileSystem api. (Boris Shkolnik via szetszwo) HADOOP-6192. Fix Shell.getUlimitMemoryCommand to not rely on Map-Reduce - specific configs. (acmurthy) + specific configs. (acmurthy) HADOOP-6103. Clones the classloader as part of Configuration clone. (Amareshwari Sriramadasu via ddas) @@ -7282,7 +7279,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6152. Fix classpath variables in bin/hadoop-config.sh and some other scripts. (Aaron Kimball via szetszwo) - HADOOP-6215. fix GenericOptionParser to deal with -D with '=' in the + HADOOP-6215. fix GenericOptionParser to deal with -D with '=' in the value. (Amar Kamat via sharad) HADOOP-6227. 
Fix Configuration to allow final parameters to be set to null @@ -7315,19 +7312,19 @@ Release 0.21.0 - 2010-08-13 hadoop-hdfs-hdfwithmr. (Philip Zeyliger via tomwhite) HADOOP-6151. Added a input filter to all of the http servlets that quotes - html characters in the parameters, to prevent cross site scripting + html characters in the parameters, to prevent cross site scripting attacks. (omalley) HADOOP-6274. Fix TestLocalFSFileContextMainOperations test failure. (Gary Murry via suresh). - HADOOP-6281. Avoid null pointer exceptions when the jsps don't have + HADOOP-6281. Avoid null pointer exceptions when the jsps don't have paramaters (omalley) HADOOP-6285. Fix the result type of the getParameterMap method in the HttpServer.QuotingInputFilter. (omalley) - HADOOP-6286. Fix bugs in related to URI handling in glob methods in + HADOOP-6286. Fix bugs in related to URI handling in glob methods in FileContext. (Boris Shkolnik via suresh) HADOOP-6292. Update native libraries guide. (Corinne Chandel via cdouglas) @@ -7341,7 +7338,7 @@ Release 0.21.0 - 2010-08-13 -libjars and -archives options and fix Path to support URI with fragment. (Amareshwari Sriramadasu via szetszwo) - HADOOP-6344. Fix rm and rmr immediately delete files rather than sending + HADOOP-6344. Fix rm and rmr immediately delete files rather than sending to trash, if a user is over-quota. (Jakob Homan via suresh) HADOOP-6347. run-test-core-fault-inject runs a test case twice if @@ -7407,7 +7404,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6521. User specified umask using deprecated dfs.umask must override server configured using new dfs.umaskmode for backward compatibility. (suresh) - + HADOOP-6522. Fix decoding of codepoint zero in UTF8. (cutting) HADOOP-6505. Use tr rather than sed to effect literal substitution in the @@ -7431,7 +7428,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6545. Changes the Key for the FileSystem cache to be UGI (ddas) - HADOOP-6609. 
Fixed deadlock in RPC by replacing shared static + HADOOP-6609. Fixed deadlock in RPC by replacing shared static DataOutputBuffer in the UTF8 class with a thread local variable. (omalley) HADOOP-6504. Invalid example in the documentation of @@ -7473,7 +7470,7 @@ Release 0.21.0 - 2010-08-13 HADOOP-6710. Symbolic umask for file creation is not conformant with posix. (suresh) - + HADOOP-6719. Insert all missing methods in FilterFs. (Rodrigo Schmidt via dhruba) @@ -7483,12 +7480,12 @@ Release 0.21.0 - 2010-08-13 HADOOP-6722. NetUtils.connect should check that it hasn't connected a socket to itself. (Todd Lipcon via tomwhite) - HADOOP-6634. Fix AccessControlList to use short names to verify access + HADOOP-6634. Fix AccessControlList to use short names to verify access control. (Vinod Kumar Vavilapalli via sharad) HADOOP-6709. Re-instate deprecated FileSystem methods that were removed after 0.20. (tomwhite) - + HADOOP-6630. hadoop-config.sh fails to get executed if hadoop wrapper scripts are in path. (Allen Wittenauer via tomwhite) @@ -7498,8 +7495,8 @@ Release 0.21.0 - 2010-08-13 HADOOP-6727. Remove UnresolvedLinkException from public FileContext APIs. (Eli Collins via tomwhite) - HADOOP-6631. Fix FileUtil.fullyDelete() to continue deleting other files - despite failure at any level. (Contributed by Ravi Gummadi and + HADOOP-6631. Fix FileUtil.fullyDelete() to continue deleting other files + despite failure at any level. (Contributed by Ravi Gummadi and Vinod Kumar Vavilapalli) HADOOP-6723. Unchecked exceptions thrown in IPC Connection should not @@ -7548,7 +7545,7 @@ Release 0.20.3 - Unreleased HADOOP-6760. WebServer shouldn't increase port number in case of negative port setting caused by Jetty's race (cos) - + HADOOP-6881. Make WritableComparator intialize classes when looking for their raw comparator, as classes often register raw comparators in initializers, which are no longer automatically run @@ -7610,7 +7607,7 @@ Release 0.20.2 - 2010-2-16 HADOOP-5612. 
Some c++ scripts are not chmodded before ant execution. (Todd Lipcon via tomwhite) - HADOOP-1849. Add undocumented configuration parameter for per handler + HADOOP-1849. Add undocumented configuration parameter for per handler call queue size in IPC Server. (shv) Release 0.20.1 - 2009-09-01 @@ -7666,7 +7663,7 @@ Release 0.20.1 - 2009-09-01 HADOOP-5688. Fix HftpFileSystem checksum path construction. (Tsz Wo (Nicholas) Sze via cdouglas) - HADOOP-4674. Fix fs help messages for -test, -text, -tail, -stat + HADOOP-4674. Fix fs help messages for -test, -text, -tail, -stat and -touchz options. (Ravi Phulari via szetszwo) HADOOP-5718. Remove the check for the default queue in capacity scheduler. @@ -7684,7 +7681,7 @@ Release 0.20.1 - 2009-09-01 is of an unknown size. (Vinod Kumar Vavilapalli via ddas) HADOOP-5636. Prevents a job from going to RUNNING state after it has been - KILLED (this used to happen when the SetupTask would come back with a + KILLED (this used to happen when the SetupTask would come back with a success after the job has been killed). (Amar Kamat via ddas) HADOOP-5641. Fix a NullPointerException in capacity scheduler's memory @@ -7693,7 +7690,7 @@ Release 0.20.1 - 2009-09-01 HADOOP-5828. Use absolute path for mapred.local.dir of JobTracker in MiniMRCluster. (yhemanth) - HADOOP-4981. Fix capacity scheduler to schedule speculative tasks + HADOOP-4981. Fix capacity scheduler to schedule speculative tasks correctly in the presence of High RAM jobs. (Sreekanth Ramakrishnan via yhemanth) @@ -7718,11 +7715,11 @@ Release 0.20.1 - 2009-09-01 available memory on a tasktracker. (Vinod Kumar Vavilapalli via yhemanth) - HADOOP-5908. Fixes a problem to do with ArithmeticException in the + HADOOP-5908. Fixes a problem to do with ArithmeticException in the JobTracker when there are jobs with 0 maps. (Amar Kamat via ddas) HADOOP-5924. Fixes a corner case problem to do with job recovery with - empty history files. 
Also, after a JT restart, sends KillTaskAction to + empty history files. Also, after a JT restart, sends KillTaskAction to tasks that report back but the corresponding job hasn't been initialized yet. (Amar Kamat via ddas) @@ -7730,7 +7727,7 @@ Release 0.20.1 - 2009-09-01 api. (Amareshwari Sriramadasu via sharad) HADOOP-5746. Fixes a corner case problem in Streaming, where if an exception - happens in MROutputThread after the last call to the map/reduce method, the + happens in MROutputThread after the last call to the map/reduce method, the exception goes undetected. (Amar Kamat via ddas) HADOOP-5884. Fixes accounting in capacity scheduler so that high RAM jobs @@ -7744,12 +7741,12 @@ Release 0.20.1 - 2009-09-01 (Sreekanth Ramakrishnan via yhemanth) HADOOP-5921. Fixes a problem in the JobTracker where it sometimes never used - to come up due to a system file creation on JobTracker's system-dir failing. - This problem would sometimes show up only when the FS for the system-dir - (usually HDFS) is started at nearly the same time as the JobTracker. + to come up due to a system file creation on JobTracker's system-dir failing. + This problem would sometimes show up only when the FS for the system-dir + (usually HDFS) is started at nearly the same time as the JobTracker. (Amar Kamat via ddas) - HADOOP-5920. Fixes a testcase failure for TestJobHistory. + HADOOP-5920. Fixes a testcase failure for TestJobHistory. (Amar Kamat via ddas) HADOOP-6139. Fix the FsShell help messages for rm and rmr. (Jakob Homan @@ -7769,11 +7766,11 @@ Release 0.20.0 - 2009-04-15 classes. Removed public, static ID::read and ID::forName; made ID an abstract class. (Suresh Srinivas via cdouglas) - HADOOP-4253. Fix various warnings generated by findbugs. + HADOOP-4253. Fix various warnings generated by findbugs. 
Following deprecated methods in RawLocalFileSystem are removed: public String getName() public void lock(Path p, boolean shared) - public void release(Path p) + public void release(Path p) (Suresh Srinivas via johan) HADOOP-4618. Move http server from FSNamesystem into NameNode. @@ -7786,7 +7783,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-4567. GetFileBlockLocations returns the NetworkTopology information of the machines where the blocks reside. (dhruba) - HADOOP-4435. The JobTracker WebUI displays the amount of heap memory + HADOOP-4435. The JobTracker WebUI displays the amount of heap memory in use. (dhruba) HADOOP-4628. Move Hive into a standalone subproject. (omalley) @@ -7820,7 +7817,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-3344. Fix libhdfs build to use autoconf and build the same architecture (32 vs 64 bit) of the JVM running Ant. The libraries for - pipes, utils, and libhdfs are now all in c++//lib. + pipes, utils, and libhdfs are now all in c++//lib. (Giridharan Kesavan via nigel) HADOOP-4874. Remove LZO codec because of licensing issues. (omalley) @@ -7828,7 +7825,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-4970. The full path name of a file is preserved inside Trash. (Prasad Chakka via dhruba) - HADOOP-4103. NameNode keeps a count of missing blocks. It warns on + HADOOP-4103. NameNode keeps a count of missing blocks. It warns on WebUI if there are such blocks. '-report' and '-metaSave' have extra info to track such blocks. 
(Raghu Angadi) @@ -7850,9 +7847,9 @@ Release 0.20.0 - 2009-04-15 by Chukwa) Added FileAdaptor for streaming small file in one chunk Added compression to archive and demux output - Added unit tests and validation for agent, collector, and demux map + Added unit tests and validation for agent, collector, and demux map reduce job - Added database loader for loading demux output (sequence file) to jdbc + Added database loader for loading demux output (sequence file) to jdbc connected database Added algorithm to distribute collector load more evenly (Jerome Boulon, Eric Yang, Andy Konwinski, Ariel Rabkin via cdouglas) @@ -7864,7 +7861,7 @@ Release 0.20.0 - 2009-04-15 move DataNode information to a separated page. (Boris Shkolnik via szetszwo) - HADOOP-4348. Add service-level authorization for Hadoop. (acmurthy) + HADOOP-4348. Add service-level authorization for Hadoop. (acmurthy) HADOOP-4826. Introduce admin command saveNamespace. (shv) @@ -7872,7 +7869,7 @@ Release 0.20.0 - 2009-04-15 populated key space (Andrzej Bialecki via stack) HADOOP-1230. Add new map/reduce API and deprecate the old one. Generally, - the old code should work without problem. The new api is in + the old code should work without problem. The new api is in org.apache.hadoop.mapreduce and the old classes in org.apache.hadoop.mapred are deprecated. Differences in the new API: 1. All of the methods take Context objects that allow us to add new @@ -7883,30 +7880,30 @@ Release 0.20.0 - 2009-04-15 3. Mapper and Reducer by default are Identity Mapper and Reducer. 4. The FileOutputFormats use part-r-00000 for the output of reduce 0 and part-m-00000 for the output of map 0. - 5. The reduce grouping comparator now uses the raw compare instead of + 5. The reduce grouping comparator now uses the raw compare instead of object compare. 6. The number of maps in FileInputFormat is controlled by min and max split size rather than min size and the desired number of maps. (omalley) - + HADOOP-3305. 
Use Ivy to manage dependencies. (Giridharan Kesavan and Steve Loughran via cutting) IMPROVEMENTS - HADOOP-4749. Added a new counter REDUCE_INPUT_BYTES. (Yongqiang He via + HADOOP-4749. Added a new counter REDUCE_INPUT_BYTES. (Yongqiang He via zshao) HADOOP-4234. Fix KFS "glue" layer to allow applications to interface with multiple KFS metaservers. (Sriram Rao via lohit) - HADOOP-4245. Update to latest version of KFS "glue" library jar. + HADOOP-4245. Update to latest version of KFS "glue" library jar. (Sriram Rao via lohit) HADOOP-4244. Change test-patch.sh to check Eclipse classpath no matter it is run by Hudson or not. (szetszwo) - HADOOP-3180. Add name of missing class to WritableName.getClass + HADOOP-3180. Add name of missing class to WritableName.getClass IOException. (Pete Wyckoff via omalley) HADOOP-4178. Make the capacity scheduler's default values configurable. @@ -7917,14 +7914,14 @@ Release 0.20.0 - 2009-04-15 HADOOP-4226. Refactor and document LineReader to make it more readily understandable. (Yuri Pradkin via cdouglas) - - HADOOP-4238. When listing jobs, if scheduling information isn't available + + HADOOP-4238. When listing jobs, if scheduling information isn't available print NA instead of empty output. (Sreekanth Ramakrishnan via johan) HADOOP-4284. Support filters that apply to all requests, or global filters, to HttpServer. (Kan Zhang via cdouglas) - - HADOOP-4276. Improve the hashing functions and deserialization of the + + HADOOP-4276. Improve the hashing functions and deserialization of the mapred ID classes. (omalley) HADOOP-4485. Add a compile-native ant task, as a shorthand. (enis) @@ -7933,13 +7930,13 @@ Release 0.20.0 - 2009-04-15 HADOOP-3461. Remove hdfs.StringBytesWritable. (szetszwo) - HADOOP-4437. Use Halton sequence instead of java.util.Random in + HADOOP-4437. Use Halton sequence instead of java.util.Random in PiEstimator. (szetszwo) - HADOOP-4572. Change INode and its sub-classes to package private. + HADOOP-4572. 
Change INode and its sub-classes to package private. (szetszwo) - HADOOP-4187. Does a runtime lookup for JobConf/JobConfigurable, and if + HADOOP-4187. Does a runtime lookup for JobConf/JobConfigurable, and if found, invokes the appropriate configure method. (Sharad Agarwal via ddas) HADOOP-4453. Improve ssl configuration and handling in HsftpFileSystem, @@ -7949,10 +7946,10 @@ Release 0.20.0 - 2009-04-15 szetszwo) HADOOP-3923. Remove org.apache.hadoop.mapred.StatusHttpServer. (szetszwo) - + HADOOP-4622. Explicitly specify interpretor for non-native pipes binaries. (Fredrik Hedberg via johan) - + HADOOP-4505. Add a unit test to test faulty setup task and cleanup task killing the job. (Amareshwari Sriramadasu via johan) @@ -7976,9 +7973,9 @@ Release 0.20.0 - 2009-04-15 HADOOP-4640. Adds an input format that can split lzo compressed text files. (johan) - - HADOOP-4666. Launch reduces only after a few maps have run in the - Fair Scheduler. (Matei Zaharia via johan) + + HADOOP-4666. Launch reduces only after a few maps have run in the + Fair Scheduler. (Matei Zaharia via johan) HADOOP-4339. Remove redundant calls from FileSystem/FsShell when generating/processing ContentSummary. (David Phillips via cdouglas) @@ -8033,24 +8030,24 @@ Release 0.20.0 - 2009-04-15 (Boris Shkolnik via cdouglas) HADOOP-4807. Adds JobClient commands to get the active/blacklisted tracker - names. Also adds commands to display running/completed task attempt IDs. + names. Also adds commands to display running/completed task attempt IDs. (ddas) HADOOP-4699. Remove checksum validation from map output servlet. (cdouglas) HADOOP-4838. Added a registry to automate metrics and mbeans management. - (Sanjay Radia via acmurthy) + (Sanjay Radia via acmurthy) - HADOOP-3136. Fixed the default scheduler to assign multiple tasks to each - tasktracker per heartbeat, when feasible. To ensure locality isn't hurt - too badly, the scheudler will not assign more than one off-switch task per - heartbeat. 
The heartbeat interval is also halved since the task-tracker is - fixed to no longer send out heartbeats on each task completion. A - slow-start for scheduling reduces is introduced to ensure that reduces - aren't started till sufficient number of maps are done, else reduces of + HADOOP-3136. Fixed the default scheduler to assign multiple tasks to each + tasktracker per heartbeat, when feasible. To ensure locality isn't hurt + too badly, the scheudler will not assign more than one off-switch task per + heartbeat. The heartbeat interval is also halved since the task-tracker is + fixed to no longer send out heartbeats on each task completion. A + slow-start for scheduling reduces is introduced to ensure that reduces + aren't started till sufficient number of maps are done, else reduces of jobs whose maps aren't scheduled might swamp the cluster. Configuration changes to mapred-default.xml: - add mapred.reduce.slowstart.completed.maps + add mapred.reduce.slowstart.completed.maps (acmurthy) HADOOP-4545. Add example and test case of secondary sort for the reduce. @@ -8069,14 +8066,14 @@ Release 0.20.0 - 2009-04-15 HADOOP-4830. Add end-to-end test cases for testing queue capacities. (Vinod Kumar Vavilapalli via yhemanth) - HADOOP-4980. Improve code layout of capacity scheduler to make it + HADOOP-4980. Improve code layout of capacity scheduler to make it easier to fix some blocker bugs. (Vivek Ratan via yhemanth) HADOOP-4916. Make user/location of Chukwa installation configurable by an external properties file. (Eric Yang via cdouglas) - HADOOP-4950. Make the CompressorStream, DecompressorStream, - BlockCompressorStream, and BlockDecompressorStream public to facilitate + HADOOP-4950. Make the CompressorStream, DecompressorStream, + BlockCompressorStream, and BlockDecompressorStream public to facilitate non-Hadoop codecs. (omalley) HADOOP-4843. Collect job history and configuration in Chukwa. (Eric Yang @@ -8084,11 +8081,11 @@ Release 0.20.0 - 2009-04-15 HADOOP-5030. 
Build Chukwa RPM to install into configured directory. (Eric Yang via cdouglas) - + HADOOP-4828. Updates documents to do with configuration (HADOOP-4631). (Sharad Agarwal via ddas) - HADOOP-4939. Adds a test that would inject random failures for tasks in + HADOOP-4939. Adds a test that would inject random failures for tasks in large jobs and would also inject TaskTracker failures. (ddas) HADOOP-4944. A configuration file can include other configuration @@ -8100,7 +8097,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-5248. A testcase that checks for the existence of job directory after the job completes. Fails if it exists. (ddas) - HADOOP-4664. Introduces multiple job initialization threads, where the + HADOOP-4664. Introduces multiple job initialization threads, where the number of threads are configurable via mapred.jobinit.threads. (Matei Zaharia and Jothi Padmanabhan via ddas) @@ -8117,7 +8114,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-5437. Fix TestMiniMRDFSSort to properly test jvm-reuse. (omalley) - HADOOP-5521. Removes dependency of TestJobInProgress on RESTART_COUNT + HADOOP-5521. Removes dependency of TestJobInProgress on RESTART_COUNT JobHistory tag. (Ravi Gummadi via ddas) OPTIMIZATIONS @@ -8144,7 +8141,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-4408. FsAction functions need not create new objects. (cdouglas) - HADOOP-4440. TestJobInProgressListener tests for jobs killed in queued + HADOOP-4440. TestJobInProgressListener tests for jobs killed in queued state (Amar Kamat via ddas) HADOOP-4346. Implement blocking connect so that Hadoop is not affected @@ -8225,10 +8222,10 @@ Release 0.20.0 - 2009-04-15 HADOOP-4623. Maintain running tasks even if speculative execution is off. (Amar Kamat via yhemanth) - HADOOP-4786. Fix broken compilation error in + HADOOP-4786. Fix broken compilation error in TestTrackerBlacklistAcrossJobs. (yhemanth) - HADOOP-4785. Fixes theJobTracker heartbeat to not make two calls to + HADOOP-4785. 
Fixes theJobTracker heartbeat to not make two calls to System.currentTimeMillis(). (Amareshwari Sriramadasu via ddas) HADOOP-4792. Add generated Chukwa configuration files to version control @@ -8252,7 +8249,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-4844. Fixed javadoc for org.apache.hadoop.fs.permission.AccessControlException to document that it's deprecated in favour of - org.apache.hadoop.security.AccessControlException. (acmurthy) + org.apache.hadoop.security.AccessControlException. (acmurthy) HADOOP-4706. Close the underlying output stream in IFileOutputStream::close. (Jothi Padmanabhan via cdouglas) @@ -8279,12 +8276,12 @@ Release 0.20.0 - 2009-04-15 (Amareshwari Sriramadasu via cdouglas) HADOOP-4879. Fix org.apache.hadoop.mapred.Counters to correctly define - Object.equals rather than depend on contentEquals api. (omalley via + Object.equals rather than depend on contentEquals api. (omalley via acmurthy) HADOOP-4791. Fix rpm build process for Chukwa. (Eric Yang via cdouglas) - HADOOP-4771. Correct initialization of the file count for directories + HADOOP-4771. Correct initialization of the file count for directories with quotas. (Ruyue Ma via shv) HADOOP-4878. Fix eclipse plugin classpath file to point to ivy's resolved @@ -8311,7 +8308,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-4889. Fix permissions in RPM packaging. (Eric Yang via cdouglas) - HADOOP-4869. Fixes the TT-JT heartbeat to have an explicit flag for + HADOOP-4869. Fixes the TT-JT heartbeat to have an explicit flag for restart apart from the initialContact flag that there was earlier. (Amareshwari Sriramadasu via ddas) @@ -8323,18 +8320,18 @@ Release 0.20.0 - 2009-04-15 HADOOP-4924. Fixes a race condition in TaskTracker re-init. (ddas) - HADOOP-4854. Read reclaim capacity interval from capacity scheduler + HADOOP-4854. Read reclaim capacity interval from capacity scheduler configuration. (Sreekanth Ramakrishnan via yhemanth) HADOOP-4896. HDFS Fsck does not load HDFS configuration. 
(Raghu Angadi) - HADOOP-4956. Creates TaskStatus for failed tasks with an empty Counters + HADOOP-4956. Creates TaskStatus for failed tasks with an empty Counters object instead of null. (ddas) HADOOP-4979. Fix capacity scheduler to block cluster for failed high RAM requirements across task types. (Vivek Ratan via yhemanth) - HADOOP-4949. Fix native compilation. (Chris Douglas via acmurthy) + HADOOP-4949. Fix native compilation. (Chris Douglas via acmurthy) HADOOP-4787. Fixes the testcase TestTrackerBlacklistAcrossJobs which was earlier failing randomly. (Amareshwari Sriramadasu via ddas) @@ -8360,7 +8357,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-4988. Fix reclaim capacity to work even when there are queues with no capacity. (Vivek Ratan via yhemanth) - HADOOP-5065. Remove generic parameters from argument to + HADOOP-5065. Remove generic parameters from argument to setIn/OutputFormatClass so that it works with SequenceIn/OutputFormat. (cdouglas via omalley) @@ -8371,7 +8368,7 @@ Release 0.20.0 - 2009-04-15 more modular and testable. (Ari Rabkin via cdouglas) HADOOP-5048. Fix capacity scheduler to correctly cleanup jobs that are - killed after initialization, but before running. + killed after initialization, but before running. (Sreekanth Ramakrishnan via yhemanth) HADOOP-4671. Mark loop control variables shared between threads as @@ -8380,10 +8377,10 @@ Release 0.20.0 - 2009-04-15 HADOOP-5079. HashFunction inadvertently destroys some randomness (Jonathan Ellis via stack) - HADOOP-4999. A failure to write to FsEditsLog results in + HADOOP-4999. A failure to write to FsEditsLog results in IndexOutOfBounds exception. (Boris Shkolnik via rangadi) - HADOOP-5139. Catch IllegalArgumentException during metrics registration + HADOOP-5139. Catch IllegalArgumentException during metrics registration in RPC. (Hairong Kuang via szetszwo) HADOOP-5085. Copying a file to local with Crc throws an exception. @@ -8401,9 +8398,9 @@ Release 0.20.0 - 2009-04-15 HADOOP-5255. 
Fix use of Math.abs to avoid overflow. (Jonathan Ellis via cdouglas) - HADOOP-5269. Fixes a problem to do with tasktracker holding on to + HADOOP-5269. Fixes a problem to do with tasktracker holding on to FAILED_UNCLEAN or KILLED_UNCLEAN tasks forever. (Amareshwari Sriramadasu - via ddas) + via ddas) HADOOP-5214. Fixes a ConcurrentModificationException while the Fairshare Scheduler accesses the tasktrackers stored by the JobTracker. @@ -8411,12 +8408,12 @@ Release 0.20.0 - 2009-04-15 HADOOP-5233. Addresses the three issues - Race condition in updating status, NPE in TaskTracker task localization when the conf file is missing - (HADOOP-5234) and NPE in handling KillTaskAction of a cleanup task + (HADOOP-5234) and NPE in handling KillTaskAction of a cleanup task (HADOOP-5235). (Amareshwari Sriramadasu via ddas) HADOOP-5247. Introduces a broadcast of KillJobAction to all trackers when - a job finishes. This fixes a bunch of problems to do with NPE when a - completed job is not in memory and a tasktracker comes to the jobtracker + a job finishes. This fixes a bunch of problems to do with NPE when a + completed job is not in memory and a tasktracker comes to the jobtracker with a status report of a task belonging to that job. (Amar Kamat via ddas) HADOOP-5282. Fixed job history logs for task attempts that are @@ -8427,7 +8424,7 @@ Release 0.20.0 - 2009-04-15 the estimation formula linear where blowUp = Total-Output/Total-Input. (Sharad Agarwal via ddas) - HADOOP-5142. Fix MapWritable#putAll to store key/value classes. + HADOOP-5142. Fix MapWritable#putAll to store key/value classes. (Do??acan G??ney via enis) HADOOP-4744. Workaround for jetty6 returning -1 when getLocalPort @@ -8442,7 +8439,7 @@ Release 0.20.0 - 2009-04-15 attempt is the first attempt of a Task. This affects JobTracker restart. (Amar Kamat via ddas) - HADOOP-5306. Fixes a problem to do with logging/parsing the http port of a + HADOOP-5306. 
Fixes a problem to do with logging/parsing the http port of a lost tracker. Affects JobTracker restart. (Amar Kamat via ddas) HADOOP-5111. Fix Job::set* methods to work with generics. (cdouglas) @@ -8458,16 +8455,16 @@ Release 0.20.0 - 2009-04-15 tasktrackers. (Amar Kamat via yhemanth) HADOOP-4695. Change TestGlobalFilter so that it allows a web page to be - filtered more than once for a single access. (Kan Zhang via szetszwo) + filtered more than once for a single access. (Kan Zhang via szetszwo) HADOOP-5298. Change TestServletFilter so that it allows a web page to be - filtered more than once for a single access. (szetszwo) + filtered more than once for a single access. (szetszwo) HADOOP-5432. Disable ssl during unit tests in hdfsproxy, as it is unused and causes failures. (cdouglas) HADOOP-5416. Correct the shell command "fs -test" forrest doc description. - (Ravi Phulari via szetszwo) + (Ravi Phulari via szetszwo) HADOOP-5327. Fixed job tracker to remove files from system directory on ACL check failures and also check ACLs on restart. @@ -8501,7 +8498,7 @@ Release 0.20.0 - 2009-04-15 Padmanabhan via ddas) HADOOP-5483. Fixes a problem in the Directory Cleanup Thread due to which - TestMiniMRWithDFS sometimes used to fail. (ddas) + TestMiniMRWithDFS sometimes used to fail. (ddas) HADOOP-5281. Prevent sharing incompatible ZlibCompressor instances between GzipCodec and DefaultCodec. (cdouglas) @@ -8518,16 +8515,16 @@ Release 0.20.0 - 2009-04-15 HADOOP-5382. Support combiners in the new context object API. (omalley) - HADOOP-5471. Fixes a problem to do with updating the log.index file in the + HADOOP-5471. Fixes a problem to do with updating the log.index file in the case where a cleanup task is run. (Amareshwari Sriramadasu via ddas) HADOOP-5534. Fixed a deadlock in Fair scheduler's servlet. (Rahul Kumar Singh via yhemanth) - HADOOP-5328. Fixes a problem in the renaming of job history files during + HADOOP-5328. 
Fixes a problem in the renaming of job history files during job recovery. (Amar Kamat via ddas) - HADOOP-5417. Don't ignore InterruptedExceptions that happen when calling + HADOOP-5417. Don't ignore InterruptedExceptions that happen when calling into rpc. (omalley) HADOOP-5320. Add a close() in TestMapReduceLocal. (Jothi Padmanabhan @@ -8584,7 +8581,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-5337. JobTracker, upon restart, now waits for the TaskTrackers to join back before scheduling new tasks. This fixes race conditions associated - with greedy scheduling as was the case earlier. (Amar Kamat via ddas) + with greedy scheduling as was the case earlier. (Amar Kamat via ddas) HADOOP-5227. Fix distcp so -update and -delete can be meaningfully combined. (Tsz Wo (Nicholas), SZE via cdouglas) @@ -8604,7 +8601,7 @@ Release 0.20.0 - 2009-04-15 HADOOP-5585. Clear FileSystem statistics between tasks when jvm-reuse is enabled. (omalley) - HADOOP-5394. JobTracker might schedule 2 attempts of the same task + HADOOP-5394. JobTracker might schedule 2 attempts of the same task with the same attempt id across restarts. (Amar Kamat via sharad) HADOOP-5645. After HADOOP-4920 we need a place to checkin @@ -8614,9 +8611,9 @@ Release 0.19.2 - 2009-06-30 BUG FIXES - HADOOP-5154. Fixes a deadlock in the fairshare scheduler. + HADOOP-5154. Fixes a deadlock in the fairshare scheduler. (Matei Zaharia via yhemanth) - + HADOOP-5146. Fixes a race condition that causes LocalDirAllocator to miss files. (Devaraj Das via yhemanth) @@ -8632,7 +8629,7 @@ Release 0.19.2 - 2009-06-30 HADOOP-5285. Fixes the issues - (1) obtainTaskCleanupTask checks whether job is inited before trying to lock the JobInProgress (2) Moves the CleanupQueue class - outside the TaskTracker and makes it a generic class that is used by the + outside the TaskTracker and makes it a generic class that is used by the JobTracker also for deleting the paths on the job's output fs. 
(3) Moves the references to completedJobStore outside the block where the JobTracker is locked. (ddas) @@ -8650,16 +8647,16 @@ Release 0.19.2 - 2009-06-30 HADOOP-5440. Fixes a problem to do with removing a taskId from the list of taskIds that the TaskTracker's TaskMemoryManager manages. (Amareshwari Sriramadasu via ddas) - + HADOOP-5446. Restore TaskTracker metrics. (cdouglas) - HADOOP-5449. Fixes the history cleaner thread. + HADOOP-5449. Fixes the history cleaner thread. (Amareshwari Sriramadasu via ddas) HADOOP-5479. NameNode should not send empty block replication request to DataNode. (hairong) - HADOOP-5259. Job with output hdfs:/user//outputpath (no + HADOOP-5259. Job with output hdfs:/user//outputpath (no authority) fails with Wrong FS. (Doug Cutting via hairong) HADOOP-5522. Documents the setup/cleanup tasks in the mapred tutorial. @@ -8689,7 +8686,7 @@ Release 0.19.2 - 2009-06-30 HADOOP-5671. Fix FNF exceptions when copying from old versions of HftpFileSystem. (Tsz Wo (Nicholas), SZE via cdouglas) - HADOOP-5213. Fix Null pointer exception caused when bzip2compression + HADOOP-5213. Fix Null pointer exception caused when bzip2compression was used and user closed a output stream without writing any data. (Zheng Shao via dhruba) @@ -8702,7 +8699,7 @@ Release 0.19.2 - 2009-06-30 HADOOP-5951. Add Apache license header to StorageInfo.java. (Suresh Srinivas via szetszwo) -Release 0.19.1 - 2009-02-23 +Release 0.19.1 - 2009-02-23 IMPROVEMENTS @@ -8741,7 +8738,7 @@ Release 0.19.1 - 2009-02-23 HADOOP-4847. Moves the loading of OutputCommitter to the Task. (Amareshwari Sriramadasu via ddas) - HADOOP-4966. Marks completed setup tasks for removal. + HADOOP-4966. Marks completed setup tasks for removal. (Amareshwari Sriramadasu via ddas) HADOOP-4982. TestFsck should run in Eclipse. (shv) @@ -8750,7 +8747,7 @@ Release 0.19.1 - 2009-02-23 fd unclosed. (hairong) HADOOP-4906. Fix TaskTracker OOM by keeping a shallow copy of JobConf in - TaskTracker.TaskInProgress. 
(Sharad Agarwal via acmurthy) + TaskTracker.TaskInProgress. (Sharad Agarwal via acmurthy) HADOOP-4918. Fix bzip2 compression to work with Sequence Files. (Zheng Shao via dhruba). @@ -8764,12 +8761,12 @@ Release 0.19.1 - 2009-02-23 verification log unclosed. (hairong) HADOOP-5086. Use the appropriate FileSystem for trash URIs. (cdouglas) - + HADOOP-4955. Make DBOutputFormat us column names from setOutput(). - (Kevin Peterson via enis) + (Kevin Peterson via enis) - HADOOP-4862. Minor : HADOOP-3678 did not remove all the cases of - spurious IOExceptions logged by DataNode. (Raghu Angadi) + HADOOP-4862. Minor : HADOOP-3678 did not remove all the cases of + spurious IOExceptions logged by DataNode. (Raghu Angadi) HADOOP-5034. NameNode should send both replication and deletion requests to DataNode in one reply to a heartbeat. (hairong) @@ -8792,14 +8789,14 @@ Release 0.19.1 - 2009-02-23 HADOOP-5067. Fixes TaskInProgress.java to keep track of count of failed and killed tasks correctly. (Amareshwari Sriramadasu via ddas) - HADOOP-4760. HDFS streams should not throw exceptions when closed twice. + HADOOP-4760. HDFS streams should not throw exceptions when closed twice. (enis) Release 0.19.0 - 2008-11-18 INCOMPATIBLE CHANGES - HADOOP-3595. Remove deprecated methods for mapred.combine.once + HADOOP-3595. Remove deprecated methods for mapred.combine.once functionality, which was necessary to providing backwards compatible combiner semantics for 0.18. (cdouglas via omalley) @@ -8818,8 +8815,8 @@ Release 0.19.0 - 2008-11-18 (Amareshwari Sriramadasu via cdouglas) HADOOP-2885. Break the hadoop.dfs package into separate packages under - hadoop.hdfs that reflect whether they are client, server, protocol, - etc. DistributedFileSystem and DFSClient have moved and are now + hadoop.hdfs that reflect whether they are client, server, protocol, + etc. DistributedFileSystem and DFSClient have moved and are now considered package private. (Sanjay Radia via omalley) HADOOP-2325. 
Require Java 6. (cutting) @@ -8835,11 +8832,11 @@ Release 0.19.0 - 2008-11-18 HADOOP-3664. Remove the deprecated method InputFormat.validateInput, which is no longer needed. (tomwhite via omalley) - HADOOP-3549. Give more meaningful errno's in libhdfs. In particular, + HADOOP-3549. Give more meaningful errno's in libhdfs. In particular, EACCES is returned for permission problems. (Ben Slusky via omalley) HADOOP-4036. ResourceStatus was added to TaskTrackerStatus by HADOOP-3759, - so increment the InterTrackerProtocol version. (Hemanth Yamijala via + so increment the InterTrackerProtocol version. (Hemanth Yamijala via omalley) HADOOP-3150. Moves task promotion to tasks. Defines a new interface for @@ -8853,15 +8850,15 @@ Release 0.19.0 - 2008-11-18 HADOOP-3245. Adds the feature for supporting JobTracker restart. Running jobs can be recovered from the history file. The history file format has - been modified to support recovery. The task attempt ID now has the - JobTracker start time to disinguish attempts of the same TIP across + been modified to support recovery. The task attempt ID now has the + JobTracker start time to disinguish attempts of the same TIP across restarts. (Amar Ramesh Kamat via ddas) - HADOOP-4007. REMOVE DFSFileInfo - FileStatus is sufficient. + HADOOP-4007. REMOVE DFSFileInfo - FileStatus is sufficient. (Sanjay Radia via hairong) HADOOP-3722. Fixed Hadoop Streaming and Hadoop Pipes to use the Tool - interface and GenericOptionsParser. (Enis Soztutar via acmurthy) + interface and GenericOptionsParser. (Enis Soztutar via acmurthy) HADOOP-2816. Cluster summary at name node web reports the space utilization as: @@ -8873,7 +8870,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-3938. Disk space quotas for HDFS. This is similar to namespace quotas in 0.18. (rangadi) - HADOOP-4293. Make Configuration Writable and remove unreleased + HADOOP-4293. Make Configuration Writable and remove unreleased WritableJobConf. Configuration.write is renamed to writeXml. 
(omalley) HADOOP-4281. Change dfsadmin to report available disk space in a format @@ -8884,10 +8881,10 @@ Release 0.19.0 - 2008-11-18 changed in HADOOP-2816: Non DFS Used - This indicates the disk space taken by non DFS file from the Configured capacity - DFS Used % - DFS Used % of Configured Capacity + DFS Used % - DFS Used % of Configured Capacity DFS Remaining % - Remaing % Configured Capacity available for DFS use - DFS command line report reflects the same change. Config parameter - dfs.datanode.du.pct is no longer used and is removed from the + DFS command line report reflects the same change. Config parameter + dfs.datanode.du.pct is no longer used and is removed from the hadoop-default.xml. (Suresh Srinivas via hairong) HADOOP-4116. Balancer should provide better resource management. (hairong) @@ -8904,16 +8901,16 @@ Release 0.19.0 - 2008-11-18 stream.reduce.output.field.separator All of them default to "\t". (Zheng Shao via omalley) - HADOOP-3479. Defines the configuration file for the resource manager in - Hadoop. You can configure various parameters related to scheduling, such + HADOOP-3479. Defines the configuration file for the resource manager in + Hadoop. You can configure various parameters related to scheduling, such as queues and queue properties here. The properties for a queue follow a naming convention,such as, hadoop.rm.queue.queue-name.property-name. (Hemanth Yamijala via ddas) - HADOOP-3149. Adds a way in which map/reducetasks can create multiple + HADOOP-3149. Adds a way in which map/reducetasks can create multiple outputs. (Alejandro Abdelnur via ddas) - HADOOP-3714. Add a new contrib, bash-tab-completion, which enables + HADOOP-3714. Add a new contrib, bash-tab-completion, which enables bash tab completion for the bin/hadoop script. See the README file in the contrib directory for the installation. (Chris Smith via enis) @@ -8922,7 +8919,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-3772. 
Add a new Hadoop Instrumentation api for the JobTracker and the TaskTracker, refactor Hadoop Metrics as an implementation of the api. - (Ari Rabkin via acmurthy) + (Ari Rabkin via acmurthy) HADOOP-2302. Provides a comparator for numerical sorting of key fields. (ddas) @@ -8932,15 +8929,15 @@ Release 0.19.0 - 2008-11-18 HADOOP-657. Free disk space should be modelled and used by the scheduler to make scheduling decisions. (Ari Rabkin via omalley) - HADOOP-3719. Initial checkin of Chukwa, which is a data collection and - analysis framework. (Jerome Boulon, Andy Konwinski, Ari Rabkin, + HADOOP-3719. Initial checkin of Chukwa, which is a data collection and + analysis framework. (Jerome Boulon, Andy Konwinski, Ari Rabkin, and Eric Yang) HADOOP-3873. Add -filelimit and -sizelimit options to distcp to cap the number of files/bytes copied in a particular run to support incremental updates and mirroring. (TszWo (Nicholas), SZE via cdouglas) - HADOOP-3585. FailMon package for hardware failure monitoring and + HADOOP-3585. FailMon package for hardware failure monitoring and analysis of anomalies. (Ioannis Koltsidas via dhruba) HADOOP-1480. Add counters to the C++ Pipes API. (acmurthy via omalley) @@ -8948,7 +8945,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-3854. Add support for pluggable servlet filters in the HttpServers. (Tsz Wo (Nicholas) Sze via omalley) - HADOOP-3759. Provides ability to run memory intensive jobs without + HADOOP-3759. Provides ability to run memory intensive jobs without affecting other running tasks on the nodes. (Hemanth Yamijala via ddas) HADOOP-3746. Add a fair share scheduler. (Matei Zaharia via omalley) @@ -8970,7 +8967,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-3866. Added sort and multi-job updates in the JobTracker web ui. (Craig Weisenfluh via omalley) - HADOOP-3698. Add access control to control who is allowed to submit or + HADOOP-3698. Add access control to control who is allowed to submit or modify jobs in the JobTracker. 
(Hemanth Yamijala via omalley) HADOOP-1869. Support access times for HDFS files. (dhruba) @@ -8978,17 +8975,17 @@ Release 0.19.0 - 2008-11-18 HADOOP-3941. Extend FileSystem API to return file-checksums. (szetszwo) - HADOOP-3581. Prevents memory intensive user tasks from taking down + HADOOP-3581. Prevents memory intensive user tasks from taking down nodes. (Vinod K V via ddas) HADOOP-3970. Provides a way to recover counters written to JobHistory. (Amar Kamat via ddas) HADOOP-3702. Adds ChainMapper and ChainReducer classes allow composing - chains of Maps and Reduces in a single Map/Reduce job, something like + chains of Maps and Reduces in a single Map/Reduce job, something like MAP+ / REDUCE MAP*. (Alejandro Abdelnur via ddas) - HADOOP-3445. Add capacity scheduler that provides guaranteed capacities to + HADOOP-3445. Add capacity scheduler that provides guaranteed capacities to queues as a percentage of the cluster. (Vivek Ratan via omalley) HADOOP-3992. Add a synthetic load generation facility to the test @@ -9006,10 +9003,10 @@ Release 0.19.0 - 2008-11-18 HADOOP-4176. Implement getFileChecksum(Path) in HftpFileSystem. (szetszwo) - HADOOP-249. Reuse JVMs across Map-Reduce Tasks. + HADOOP-249. Reuse JVMs across Map-Reduce Tasks. Configuration changes to hadoop-default.xml: add mapred.job.reuse.jvm.num.tasks - (Devaraj Das via acmurthy) + (Devaraj Das via acmurthy) HADOOP-4070. Provide a mechanism in Hive for registering UDFs from the query language. (tomwhite) @@ -9022,14 +9019,14 @@ Release 0.19.0 - 2008-11-18 (cdouglas via omalley) HADOOP-3924. Added a 'KILLED' job status. (Subramaniam Krishnan via - acmurthy) + acmurthy) IMPROVEMENTS HADOOP-4205. hive: metastore and ql to use the refactored SerDe library. (zshao) - HADOOP-4106. libhdfs: add time, permission and user attribute support + HADOOP-4106. libhdfs: add time, permission and user attribute support (part 2). (Pete Wyckoff through zshao) HADOOP-4104. 
libhdfs: add time, permission and user attribute support. @@ -9050,7 +9047,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-2664. Add a lzop compatible codec, so that files compressed by lzop may be processed by map/reduce. (cdouglas via omalley) - HADOOP-3655. Add additional ant properties to control junit. (Steve + HADOOP-3655. Add additional ant properties to control junit. (Steve Loughran via omalley) HADOOP-3543. Update the copyright year to 2008. (cdouglas via omalley) @@ -9068,20 +9065,20 @@ Release 0.19.0 - 2008-11-18 the reduce than serialization/deserialization. (Runping Qi via cdouglas) HADOOP-3478. Improves the handling of map output fetching. Now the - randomization is by the hosts (and not the map outputs themselves). + randomization is by the hosts (and not the map outputs themselves). (Jothi Padmanabhan via ddas) HADOOP-3617. Removed redundant checks of accounting space in MapTask and makes the spill thread persistent so as to avoid creating a new one for - each spill. (Chris Douglas via acmurthy) + each spill. (Chris Douglas via acmurthy) HADOOP-3412. Factor the scheduler out of the JobTracker and make it pluggable. (Tom White and Brice Arnould via omalley) - HADOOP-3756. Minor. Remove unused dfs.client.buffer.dir from + HADOOP-3756. Minor. Remove unused dfs.client.buffer.dir from hadoop-default.xml. (rangadi) - HADOOP-3747. Adds counter suport for MultipleOutputs. + HADOOP-3747. Adds counter suport for MultipleOutputs. (Alejandro Abdelnur via ddas) HADOOP-3169. LeaseChecker daemon should not be started in DFSClient @@ -9105,16 +9102,16 @@ Release 0.19.0 - 2008-11-18 HADOOP-3620. Namenode should synchronously resolve a datanode's network location when the datanode registers. (hairong) - HADOOP-3860. NNThroughputBenchmark is extended with rename and delete + HADOOP-3860. NNThroughputBenchmark is extended with rename and delete benchmarks. (shv) - + HADOOP-3892. Include unix group name in JobConf. (Matei Zaharia via johan) HADOOP-3875. 
Change the time period between heartbeats to be relative to the end of the heartbeat rpc, rather than the start. This causes better behavior if the JobTracker is overloaded. (acmurthy via omalley) - HADOOP-3853. Move multiple input format (HADOOP-372) extension to + HADOOP-3853. Move multiple input format (HADOOP-372) extension to library package. (tomwhite via johan) HADOOP-9. Use roulette scheduling for temporary space when the size @@ -9123,13 +9120,13 @@ Release 0.19.0 - 2008-11-18 HADOOP-3202. Use recursive delete rather than FileUtil.fullyDelete. (Amareshwari Sriramadasu via omalley) - HADOOP-3368. Remove common-logging.properties from conf. (Steve Loughran + HADOOP-3368. Remove common-logging.properties from conf. (Steve Loughran via omalley) - HADOOP-3851. Fix spelling mistake in FSNamesystemMetrics. (Steve Loughran + HADOOP-3851. Fix spelling mistake in FSNamesystemMetrics. (Steve Loughran via omalley) - HADOOP-3780. Remove asynchronous resolution of network topology in the + HADOOP-3780. Remove asynchronous resolution of network topology in the JobTracker (Amar Kamat via omalley) HADOOP-3852. Add ShellCommandExecutor.toString method to make nicer @@ -9148,7 +9145,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-3742. Remove HDFS from public java doc and add javadoc-dev for generative javadoc for developers. (Sanjay Radia via omalley) - HADOOP-3944. Improve documentation for public TupleWritable class in + HADOOP-3944. Improve documentation for public TupleWritable class in join package. (Chris Douglas via enis) HADOOP-2330. Preallocate HDFS transaction log to improve performance. @@ -9156,16 +9153,16 @@ Release 0.19.0 - 2008-11-18 HADOOP-3965. Convert DataBlockScanner into a package private class. (shv) - HADOOP-3488. Prevent hadoop-daemon from rsync'ing log files (Stefan + HADOOP-3488. Prevent hadoop-daemon from rsync'ing log files (Stefan Groshupf and Craig Macdonald via omalley) - HADOOP-3342. 
Change the kill task actions to require http post instead of + HADOOP-3342. Change the kill task actions to require http post instead of get to prevent accidental crawls from triggering it. (enis via omalley) - HADOOP-3937. Limit the job name in the job history filename to 50 + HADOOP-3937. Limit the job name in the job history filename to 50 characters. (Matei Zaharia via omalley) - HADOOP-3943. Remove unnecessary synchronization in + HADOOP-3943. Remove unnecessary synchronization in NetworkTopology.pseudoSortByDistance. (hairong via omalley) HADOOP-3498. File globbing alternation should be able to span path @@ -9180,7 +9177,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-4147. Remove unused class JobWithTaskContext from class JobInProgress. (Amareshwari Sriramadasu via johan) - HADOOP-4151. Add a byte-comparable interface that both Text and + HADOOP-4151. Add a byte-comparable interface that both Text and BytesWritable implement. (cdouglas via omalley) HADOOP-4174. Move fs image/edit log methods from ClientProtocol to @@ -9192,7 +9189,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-4186. Factor LineReader out of LineRecordReader. (tomwhite via omalley) - HADOOP-4184. Break the module dependencies between core, hdfs, and + HADOOP-4184. Break the module dependencies between core, hdfs, and mapred. (tomwhite via omalley) HADOOP-4075. test-patch.sh now spits out ant commands that it runs. @@ -9205,20 +9202,20 @@ Release 0.19.0 - 2008-11-18 (Chris K Wensel via tomwhite) HADOOP-4083. Changed the configuration attribute queue.name to - mapred.job.queue.name. (Hemanth Yamijala via acmurthy) + mapred.job.queue.name. (Hemanth Yamijala via acmurthy) HADOOP-4194. Added the JobConf and JobID to job-related methods in - JobTrackerInstrumentation for better metrics. (Mac Yang via acmurthy) + JobTrackerInstrumentation for better metrics. (Mac Yang via acmurthy) HADOOP-3975. Change test-patch script to report working the dir modifications preventing the suite from being run. 
(Ramya R via cdouglas) HADOOP-4124. Added a command-line switch to allow users to set job priorities, also allow it to be manipulated via the web-ui. (Hemanth - Yamijala via acmurthy) + Yamijala via acmurthy) HADOOP-2165. Augmented JobHistory to include the URIs to the tasks' - userlogs. (Vinod Kumar Vavilapalli via acmurthy) + userlogs. (Vinod Kumar Vavilapalli via acmurthy) HADOOP-4062. Remove the synchronization on the output stream when a connection is closed and also remove an undesirable exception when @@ -9233,7 +9230,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-4279. Trace the seeds of random sequences in append unit tests to make itermitant failures reproducible. (szetszwo via cdouglas) - HADOOP-4209. Remove the change to the format of task attempt id by + HADOOP-4209. Remove the change to the format of task attempt id by incrementing the task attempt numbers by 1000 when the job restarts. (Amar Kamat via omalley) @@ -9245,7 +9242,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-3790. Add more unit tests for testing HDFS file append. (szetszwo) - HADOOP-4321. Include documentation for the capacity scheduler. (Hemanth + HADOOP-4321. Include documentation for the capacity scheduler. (Hemanth Yamijala via omalley) HADOOP-4424. Change menu layout for Hadoop documentation (Boris Shkolnik @@ -9261,11 +9258,11 @@ Release 0.19.0 - 2008-11-18 OPTIMIZATIONS - HADOOP-3556. Removed lock contention in MD5Hash by changing the - singleton MessageDigester by an instance per Thread using + HADOOP-3556. Removed lock contention in MD5Hash by changing the + singleton MessageDigester by an instance per Thread using ThreadLocal. (Iv?n de Prado via omalley) - HADOOP-3328. When client is writing data to DFS, only the last + HADOOP-3328. When client is writing data to DFS, only the last datanode in the pipeline needs to verify the checksum. Saves around 30% CPU on intermediate datanodes. (rangadi) @@ -9281,7 +9278,7 @@ Release 0.19.0 - 2008-11-18 versions. (acmurthy via omalley) HADOOP-3769. 
Make the SampleMapper and SampleReducer from - GenericMRLoadGenerator public, so they can be used in other contexts. + GenericMRLoadGenerator public, so they can be used in other contexts. (Lingyun Yang via omalley) HADOOP-3514. Inline the CRCs in intermediate files as opposed to reading @@ -9290,23 +9287,23 @@ Release 0.19.0 - 2008-11-18 HADOOP-3638. Caches the iFile index files in memory to reduce seeks (Jothi Padmanabhan via ddas) - HADOOP-4225. FSEditLog.logOpenFile() should persist accessTime + HADOOP-4225. FSEditLog.logOpenFile() should persist accessTime rather than modificationTime. (shv) - HADOOP-4380. Made several new classes (Child, JVMId, - JobTrackerInstrumentation, QueueManager, ResourceEstimator, - TaskTrackerInstrumentation, and TaskTrackerMetricsInst) in + HADOOP-4380. Made several new classes (Child, JVMId, + JobTrackerInstrumentation, QueueManager, ResourceEstimator, + TaskTrackerInstrumentation, and TaskTrackerMetricsInst) in org.apache.hadoop.mapred package private instead of public. (omalley) BUG FIXES - HADOOP-3563. Refactor the distributed upgrade code so that it is + HADOOP-3563. Refactor the distributed upgrade code so that it is easier to identify datanode and namenode related code. (dhruba) HADOOP-3640. Fix the read method in the NativeS3InputStream. (tomwhite via omalley) - HADOOP-3711. Fixes the Streaming input parsing to properly find the + HADOOP-3711. Fixes the Streaming input parsing to properly find the separator. (Amareshwari Sriramadasu via ddas) HADOOP-3725. Prevent TestMiniMRMapDebugScript from swallowing exceptions. @@ -9332,15 +9329,15 @@ Release 0.19.0 - 2008-11-18 the JobTracker web/ui. (Amar Kamat via omalley) HADOOP-3777. Ensure that Lzo compressors/decompressors correctly handle the - case where native libraries aren't available. (Chris Douglas via acmurthy) + case where native libraries aren't available. (Chris Douglas via acmurthy) HADOOP-3728. 
Fix SleepJob so that it doesn't depend on temporary files, this ensures we can now run more than one instance of SleepJob - simultaneously. (Chris Douglas via acmurthy) + simultaneously. (Chris Douglas via acmurthy) HADOOP-3795. Fix saving image files on Namenode with different checkpoint stamps. (Lohit Vijayarenu via mahadev) - + HADOOP-3624. Improving createeditslog to create tree directory structure. (Lohit Vijayarenu via mahadev) @@ -9358,20 +9355,20 @@ Release 0.19.0 - 2008-11-18 calling it for each task start. (acmurthy via omalley) HADOOP-3131. Fix reduce progress reporting for compressed intermediate - data. (Matei Zaharia via acmurthy) + data. (Matei Zaharia via acmurthy) HADOOP-3796. fuse-dfs configuration is implemented as file system mount options. (Pete Wyckoff via dhruba) - HADOOP-3836. Fix TestMultipleOutputs to correctly clean up. (Alejandro + HADOOP-3836. Fix TestMultipleOutputs to correctly clean up. (Alejandro Abdelnur via acmurthy) HADOOP-3805. Improve fuse-dfs write performance. (Pete Wyckoff via zshao) - HADOOP-3846. Fix unit test CreateEditsLog to generate paths correctly. + HADOOP-3846. Fix unit test CreateEditsLog to generate paths correctly. (Lohit Vjayarenu via cdouglas) - + HADOOP-3904. Fix unit tests using the old dfs package name. (TszWo (Nicholas), SZE via johan) @@ -9381,13 +9378,13 @@ Release 0.19.0 - 2008-11-18 HADOOP-3907. Move INodeDirectoryWithQuota to its own .java file. (Tsz Wo (Nicholas), SZE via hairong) - HADOOP-3919. Fix attribute name in hadoop-default for + HADOOP-3919. Fix attribute name in hadoop-default for mapred.jobtracker.instrumentation. (Ari Rabkin via omalley) HADOOP-3903. Change the package name for the servlets to be hdfs instead of dfs. (Tsz Wo (Nicholas) Sze via omalley) - HADOOP-3773. Change Pipes to set the default map output key and value + HADOOP-3773. Change Pipes to set the default map output key and value types correctly. (Koji Noguchi via omalley) HADOOP-3952. 
Fix compilation error in TestDataJoin referencing dfs package. @@ -9403,7 +9400,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-3949. Remove duplicate jars from Chukwa. (Jerome Boulon via omalley) - HADOOP-3933. DataNode sometimes sends up to io.byte.per.checksum bytes + HADOOP-3933. DataNode sometimes sends up to io.byte.per.checksum bytes more than required to client. (Ning Li via rangadi) HADOOP-3962. Shell command "fs -count" should support paths with different @@ -9415,7 +9412,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-3958. Fix TestMapRed to check the success of test-job. (omalley via acmurthy) - HADOOP-3985. Fix TestHDFSServerPorts to use random ports. (Hairong Kuang + HADOOP-3985. Fix TestHDFSServerPorts to use random ports. (Hairong Kuang via omalley) HADOOP-3964. Fix javadoc warnings introduced by FailMon. (dhruba) @@ -9429,7 +9426,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-3705. Fix mapred.join parser to accept InputFormats named with underscore and static, inner classes. (cdouglas) - HADOOP-4023. Fix javadoc warnings introduced when the HDFS javadoc was + HADOOP-4023. Fix javadoc warnings introduced when the HDFS javadoc was made private. (omalley) HADOOP-4030. Remove lzop from the default list of codecs. (Arun Murthy via @@ -9442,13 +9439,13 @@ Release 0.19.0 - 2008-11-18 HADOOP-2168. Fix problem with C++ record reader's progress not being reported to framework. (acmurthy via omalley) - HADOOP-3966. Copy findbugs generated output files to PATCH_DIR while + HADOOP-3966. Copy findbugs generated output files to PATCH_DIR while running test-patch. (Ramya R via lohit) HADOOP-4037. Fix the eclipse plugin for versions of kfs and log4j. (nigel via omalley) - HADOOP-3950. Cause the Mini MR cluster to wait for task trackers to + HADOOP-3950. Cause the Mini MR cluster to wait for task trackers to register before continuing. (enis via omalley) HADOOP-3910. Remove unused ClusterTestDFSNamespaceLogging and @@ -9462,18 +9459,18 @@ Release 0.19.0 - 2008-11-18 HADOOP-4069. 
Keep temporary test files from TestKosmosFileSystem under test.build.data instead of /tmp. (lohit via omalley) - + HADOOP-4078. Create test files for TestKosmosFileSystem in separate directory under test.build.data. (lohit) HADOOP-3968. Fix getFileBlockLocations calls to use FileStatus instead of Path reflecting the new API. (Pete Wyckoff via lohit) - HADOOP-3963. libhdfs does not exit on its own, instead it returns error + HADOOP-3963. libhdfs does not exit on its own, instead it returns error to the caller and behaves as a true library. (Pete Wyckoff via dhruba) - HADOOP-4100. Removes the cleanupTask scheduling from the Scheduler - implementations and moves it to the JobTracker. + HADOOP-4100. Removes the cleanupTask scheduling from the Scheduler + implementations and moves it to the JobTracker. (Amareshwari Sriramadasu via ddas) HADOOP-4097. Make hive work well with speculative execution turned on. @@ -9486,30 +9483,30 @@ Release 0.19.0 - 2008-11-18 (hairong) HADOOP-4071. FSNameSystem.isReplicationInProgress should add an - underReplicated block to the neededReplication queue using method + underReplicated block to the neededReplication queue using method "add" not "update". (hairong) HADOOP-4154. Fix type warnings in WritableUtils. (szetszwo via omalley) - HADOOP-4133. Log files generated by Hive should reside in the + HADOOP-4133. Log files generated by Hive should reside in the build directory. (Prasad Chakka via dhruba) HADOOP-4094. Hive now has hive-default.xml and hive-site.xml similar to core hadoop. (Prasad Chakka via dhruba) - HADOOP-4112. Handles cleanupTask in JobHistory + HADOOP-4112. Handles cleanupTask in JobHistory (Amareshwari Sriramadasu via ddas) HADOOP-3831. Very slow reading clients sometimes failed while reading. (rangadi) HADOOP-4155. Use JobTracker's start time while initializing JobHistory's - JobTracker Unique String. (lohit) + JobTracker Unique String. (lohit) HADOOP-4099. Fix null pointer when using HFTP from an 0.18 server. 
(dhruba via omalley) - HADOOP-3570. Includes user specified libjar files in the client side + HADOOP-3570. Includes user specified libjar files in the client side classpath path. (Sharad Agarwal via ddas) HADOOP-4129. Changed memory limits of TaskTracker and Tasks to be in @@ -9518,7 +9515,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-4139. Optimize Hive multi group-by. (Namin Jain via dhruba) - HADOOP-3911. Add a check to fsck options to make sure -files is not + HADOOP-3911. Add a check to fsck options to make sure -files is not the first option to resolve conflicts with GenericOptionsParser (lohit) @@ -9539,7 +9536,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-4195. Close compressor before returning to codec pool. (acmurthy via omalley) - HADOOP-2403. Escapes some special characters before logging to + HADOOP-2403. Escapes some special characters before logging to history files. (Amareshwari Sriramadasu via ddas) HADOOP-4200. Fix a bug in the test-patch.sh script. @@ -9550,7 +9547,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-4121. Preserve cause for exception if the initialization of HistoryViewer for JobHistory fails. (Amareshwari Sri Ramadasu via - acmurthy) + acmurthy) HADOOP-4213. Fixes NPE in TestLimitTasksPerJobTaskScheduler. (Sreekanth Ramakrishnan via ddas) @@ -9561,7 +9558,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-3592. Fix a couple of possible file leaks in FileUtil (Bill de hOra via rangadi) - HADOOP-4120. Hive interactive shell records the time taken by a + HADOOP-4120. Hive interactive shell records the time taken by a query. (Raghotham Murthy via dhruba) HADOOP-4090. The hive scripts pick up hadoop from HADOOP_HOME @@ -9577,17 +9574,17 @@ Release 0.19.0 - 2008-11-18 examples.jar doesn't depend on tools.jar. (omalley) HADOOP-4269. Fix the deprecation of LineReader by extending the new class - into the old name and deprecating it. Also update the tests to test the + into the old name and deprecating it. Also update the tests to test the new class. 
(cdouglas via omalley) - HADOOP-4280. Fix conversions between seconds in C and milliseconds in + HADOOP-4280. Fix conversions between seconds in C and milliseconds in Java for access times for files. (Pete Wyckoff via rangadi) HADOOP-4254. -setSpaceQuota command does not convert "TB" extenstion to terabytes properly. Implementation now uses StringUtils for parsing this. (Raghu Angadi) - HADOOP-4259. Findbugs should run over tools.jar also. (cdouglas via + HADOOP-4259. Findbugs should run over tools.jar also. (cdouglas via omalley) HADOOP-4275. Move public method isJobValidName from JobID to a private @@ -9607,13 +9604,13 @@ Release 0.19.0 - 2008-11-18 HADOOP-4237. Fixes the TestStreamingBadRecords.testNarrowDown testcase. (Sharad Agarwal via ddas) - HADOOP-4274. Capacity scheduler accidently modifies the underlying + HADOOP-4274. Capacity scheduler accidently modifies the underlying data structures when browing the job lists. (Hemanth Yamijala via omalley) HADOOP-4309. Fix eclipse-plugin compilation. (cdouglas) HADOOP-4232. Fix race condition in JVM reuse when multiple slots become - free. (ddas via acmurthy) + free. (ddas via acmurthy) HADOOP-4302. Fix a race condition in TestReduceFetch that can yield false negatvies. (cdouglas) @@ -9627,26 +9624,26 @@ Release 0.19.0 - 2008-11-18 HADOOP-4246. Ensure we have the correct lower bound on the number of retries for fetching map-outputs; also fixed the case where the reducer automatically kills on too many unique map-outputs could not be fetched - for small jobs. (Amareshwari Sri Ramadasu via acmurthy) + for small jobs. (Amareshwari Sri Ramadasu via acmurthy) HADOOP-4163. Report FSErrors from map output fetch threads instead of merely logging them. (Sharad Agarwal via cdouglas) - HADOOP-4261. Adds a setup task for jobs. This is required so that we + HADOOP-4261. Adds a setup task for jobs. This is required so that we don't setup jobs that haven't been inited yet (since init could lead - to job failure). 
Only after the init has successfully happened do we + to job failure). Only after the init has successfully happened do we launch the setupJob task. (Amareshwari Sriramadasu via ddas) - HADOOP-4256. Removes Completed and Failed Job tables from + HADOOP-4256. Removes Completed and Failed Job tables from jobqueue_details.jsp. (Sreekanth Ramakrishnan via ddas) - HADOOP-4267. Occasional exceptions during shutting down HSQLDB is logged - but not rethrown. (enis) + HADOOP-4267. Occasional exceptions during shutting down HSQLDB is logged + but not rethrown. (enis) - HADOOP-4018. The number of tasks for a single job cannot exceed a + HADOOP-4018. The number of tasks for a single job cannot exceed a pre-configured maximum value. (dhruba) - HADOOP-4288. Fixes a NPE problem in CapacityScheduler. + HADOOP-4288. Fixes a NPE problem in CapacityScheduler. (Amar Kamat via ddas) HADOOP-4014. Create hard links with 'fsutil hardlink' on Windows. (shv) @@ -9666,20 +9663,20 @@ Release 0.19.0 - 2008-11-18 (Jeff Hammerbacher via omalley) HADOOP-4378. Fix TestJobQueueInformation to use SleepJob rather than - WordCount via TestMiniMRWithDFS. (Sreekanth Ramakrishnan via acmurthy) + WordCount via TestMiniMRWithDFS. (Sreekanth Ramakrishnan via acmurthy) HADOOP-4376. Fix formatting in hadoop-default.xml for - hadoop.http.filter.initializers. (Enis Soztutar via acmurthy) + hadoop.http.filter.initializers. (Enis Soztutar via acmurthy) HADOOP-4410. Adds an extra arg to the API FileUtil.makeShellPath to determine whether to canonicalize file paths or not. (Amareshwari Sriramadasu via ddas) HADOOP-4236. Ensure un-initialized jobs are killed correctly on - user-demand. (Sharad Agarwal via acmurthy) + user-demand. (Sharad Agarwal via acmurthy) HADOOP-4373. Fix calculation of Guaranteed Capacity for the - capacity-scheduler. (Hemanth Yamijala via acmurthy) + capacity-scheduler. (Hemanth Yamijala via acmurthy) HADOOP-4053. Schedulers must be notified when jobs complete. 
(Amar Kamat via omalley) @@ -9692,9 +9689,9 @@ Release 0.19.0 - 2008-11-18 HADOOP-4418. Updates documentation in forrest for Mapred, streaming and pipes. (Amareshwari Sriramadasu via ddas) - HADOOP-3155. Ensure that there is only one thread fetching + HADOOP-3155. Ensure that there is only one thread fetching TaskCompletionEvents on TaskTracker re-init. (Dhruba Borthakur via - acmurthy) + acmurthy) HADOOP-4425. Fix EditLogInputStream to overload the bulk read method. (cdouglas) @@ -9719,7 +9716,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-4464. Separate out TestFileCreationClient from TestFileCreation. (Tsz Wo (Nicholas), SZE via cdouglas) - HADOOP-4404. saveFSImage() removes files from a storage directory that do + HADOOP-4404. saveFSImage() removes files from a storage directory that do not correspond to its type. (shv) HADOOP-4149. Fix handling of updates to the job priority, by changing the @@ -9736,8 +9733,8 @@ Release 0.19.0 - 2008-11-18 HADOOP-4230. Fix for serde2 interface, limit operator, select * operator, UDF trim functions and sampling. (Ashish Thusoo via dhruba) - HADOOP-4358. No need to truncate access time in INode. Also fixes NPE - in CreateEditsLog. (Raghu Angadi) + HADOOP-4358. No need to truncate access time in INode. Also fixes NPE + in CreateEditsLog. (Raghu Angadi) HADOOP-4387. TestHDFSFileSystemContract fails on windows nightly builds. (Raghu Angadi) @@ -9753,7 +9750,7 @@ Release 0.19.0 - 2008-11-18 regex patterns work. (Chris Wensel via acmurthy) HADOOP-4446. Modify guaranteed capacity labels in capacity scheduler's UI - to reflect the information being displayed. (Sreekanth Ramakrishnan via + to reflect the information being displayed. (Sreekanth Ramakrishnan via yhemanth) HADOOP-4282. Some user facing URLs are not filtered by user filters. @@ -9765,7 +9762,7 @@ Release 0.19.0 - 2008-11-18 HADOOP-4552. Fix a deadlock in RPC server. (Raghu Angadi) HADOOP-4471. Sort running jobs by priority in the capacity scheduler. 
- (Amar Kamat via yhemanth) + (Amar Kamat via yhemanth) HADOOP-4500. Fix MultiFileSplit to get the FileSystem from the relevant path rather than the JobClient. (Joydeep Sen Sarma via cdouglas) @@ -9774,12 +9771,12 @@ Release 0.18.4 - Unreleased BUG FIXES - HADOOP-5114. Remove timeout for accept() in DataNode. This makes accept() + HADOOP-5114. Remove timeout for accept() in DataNode. This makes accept() fail in JDK on Windows and causes many tests to fail. (Raghu Angadi) HADOOP-5192. Block receiver should not remove a block that's created or being written by other threads. (hairong) - + HADOOP-5134. FSNamesystem#commitBlockSynchronization adds under-construction block locations to blocksMap. (Dhruba Borthakur via hairong) @@ -9819,7 +9816,7 @@ Release 0.18.3 - 2009-01-27 HADOOP-3121. lsr should keep listing the remaining items but not terminate if there is any IOException. (szetszwo) - HADOOP-4610. Always calculate mis-replicated blocks when safe-mode is + HADOOP-4610. Always calculate mis-replicated blocks when safe-mode is turned off. (shv) HADOOP-3883. Limit namenode to assign at most one generation stamp for @@ -9908,15 +9905,15 @@ Release 0.18.3 - 2009-01-27 HADOOP-4951. Lease monitor should acquire the LeaseManager lock but not the Monitor lock. (szetszwo) - HADOOP-4935. processMisReplicatedBlocks() should not clear + HADOOP-4935. processMisReplicatedBlocks() should not clear excessReplicateMap. (shv) - HADOOP-4961. Fix ConcurrentModificationException in lease recovery + HADOOP-4961. Fix ConcurrentModificationException in lease recovery of empty files. (shv) HADOOP-4971. A long (unexpected) delay at datanodes could make subsequent block reports from many datanode at the same time. (Raghu Angadi) - + HADOOP-4910. NameNode should exclude replicas when choosing excessive replicas to delete to avoid data lose. (hairong) @@ -9955,16 +9952,16 @@ Release 0.18.2 - 2008-11-03 HADOOP-4469. Rename and add the ant task jar file to the tar file. (nigel) - HADOOP-3914. 
DFSClient sends Checksum Ok only once for a block. + HADOOP-3914. DFSClient sends Checksum Ok only once for a block. (Christian Kunz via hairong) - + HADOOP-4467. SerializationFactory now uses the current context ClassLoader allowing for user supplied Serialization instances. (Chris Wensel via acmurthy) HADOOP-4517. Release FSDataset lock before joining ongoing create threads. (szetszwo) - + HADOOP-4526. fsck failing with NullPointerException. (hairong) HADOOP-4483 Honor the max parameter in DatanodeDescriptor.getBlockArray(..) @@ -9993,10 +9990,10 @@ Release 0.18.1 - 2008-09-17 CodecPool when closed more than once. (Arun Murthy via cdouglas) HADOOP-4040. Remove coded default of the IPC idle connection timeout - from the TaskTracker, which was causing HDFS client connections to not be + from the TaskTracker, which was causing HDFS client connections to not be collected. (ddas via omalley) - HADOOP-4046. Made WritableComparable's constructor protected instead of + HADOOP-4046. Made WritableComparable's constructor protected instead of private to re-enable class derivation. (cdouglas via omalley) HADOOP-3940. Fix in-memory merge condition to wait when there are no map @@ -10009,7 +10006,7 @@ Release 0.18.0 - 2008-08-19 HADOOP-2703. The default options to fsck skips checking files that are being written to. The output of fsck is incompatible - with previous release. (lohit vijayarenu via dhruba) + with previous release. (lohit vijayarenu via dhruba) HADOOP-2865. FsShell.ls() printout format changed to print file names in the end of the line. (Edward J. Yoon via shv) @@ -10019,18 +10016,18 @@ Release 0.18.0 - 2008-08-19 second RPC sets the generation stamp of an existing block. (Tsz Wo (Nicholas), SZE via dhruba) - HADOOP-2797. Code related to upgrading to 0.14 (Block CRCs) is + HADOOP-2797. Code related to upgrading to 0.14 (Block CRCs) is removed. As result, upgrade to 0.18 or later from 0.13 or earlier is not supported. 
If upgrading from 0.13 or earlier is required, please upgrade to an intermediate version (0.14-0.17) and then to this version. (rangadi) - HADOOP-544. This issue introduces new classes JobID, TaskID and + HADOOP-544. This issue introduces new classes JobID, TaskID and TaskAttemptID, which should be used instead of their string counterparts. - Functions in JobClient, TaskReport, RunningJob, jobcontrol.Job and - TaskCompletionEvent that use string arguments are deprecated in favor - of the corresponding ones that use ID objects. Applications can use - xxxID.toString() and xxxID.forName() methods to convert/restore objects + Functions in JobClient, TaskReport, RunningJob, jobcontrol.Job and + TaskCompletionEvent that use string arguments are deprecated in favor + of the corresponding ones that use ID objects. Applications can use + xxxID.toString() and xxxID.forName() methods to convert/restore objects to/from strings. (Enis Soztutar via ddas) HADOOP-2188. RPC client sends a ping rather than throw timeouts. @@ -10039,8 +10036,8 @@ Release 0.18.0 - 2008-08-19 The property ipc.client.timeout is removed from the default hadoop configuration. It also removes metrics RpcOpsDiscardedOPsNum. (hairong) - HADOOP-2181. This issue adds logging for input splits in Jobtracker log - and jobHistory log. Also adds web UI for viewing input splits in job UI + HADOOP-2181. This issue adds logging for input splits in Jobtracker log + and jobHistory log. Also adds web UI for viewing input splits in job UI and history UI. (Amareshwari Sriramadasu via ddas) HADOOP-3226. Run combiners multiple times over map outputs as they @@ -10057,7 +10054,7 @@ Release 0.18.0 - 2008-08-19 (Tsz Wo (Nicholas), SZE via rangadi) HADOOP-3405. Made some map/reduce internal classes non-public: - MapTaskStatus, ReduceTaskStatus, JobSubmissionProtocol, + MapTaskStatus, ReduceTaskStatus, JobSubmissionProtocol, CompletedJobStatusStore. (enis via omaley) HADOOP-3265. Removed depcrecated API getFileCacheHints(). 
@@ -10078,7 +10075,7 @@ Release 0.18.0 - 2008-08-19 (Mukund Madhugiri via omally) HADOOP-3113. An fsync invoked on a HDFS file really really - persists data! The datanode moves blocks in the tmp directory to + persists data! The datanode moves blocks in the tmp directory to the real block directory on a datanode-restart. (dhruba) HADOOP-3452. Change fsck to return non-zero status for a corrupt @@ -10121,24 +10118,24 @@ Release 0.18.0 - 2008-08-19 "hdfs:" URIs now defaults to 8020, so that one may simply use URIs of the form "hdfs://example.com/dir/file". (cutting) - HADOOP-2019. Adds support for .tar, .tgz and .tar.gz files in + HADOOP-2019. Adds support for .tar, .tgz and .tar.gz files in DistributedCache (Amareshwari Sriramadasu via ddas) - HADOOP-3058. Add FSNamesystem status metrics. + HADOOP-3058. Add FSNamesystem status metrics. (Lohit Vjayarenu via rangadi) HADOOP-1915. Allow users to specify counters via strings instead of enumerations. (tomwhite via omalley) - HADOOP-2065. Delay invalidating corrupt replicas of block until its - is removed from under replicated state. If all replicas are found to + HADOOP-2065. Delay invalidating corrupt replicas of block until its + is removed from under replicated state. If all replicas are found to be corrupt, retain all copies and mark the block as corrupt. (Lohit Vjayarenu via rangadi) - HADOOP-3221. Adds org.apache.hadoop.mapred.lib.NLineInputFormat, which - splits files into splits each of N lines. N can be specified by + HADOOP-3221. Adds org.apache.hadoop.mapred.lib.NLineInputFormat, which + splits files into splits each of N lines. N can be specified by configuration property "mapred.line.input.format.linespermap", which - defaults to 1. (Amareshwari Sriramadasu via ddas) + defaults to 1. (Amareshwari Sriramadasu via ddas) HADOOP-3336. Direct a subset of annotated FSNamesystem calls for audit logging. (cdouglas) @@ -10178,22 +10175,22 @@ Release 0.18.0 - 2008-08-19 HADOOP-3413. 
Allow SequenceFile.Reader to use serialization framework. (tomwhite via omalley) - HADOOP-3541. Import of the namespace from a checkpoint documented + HADOOP-3541. Import of the namespace from a checkpoint documented in hadoop user guide. (shv) IMPROVEMENTS - HADOOP-3677. Simplify generation stamp upgrade by making is a + HADOOP-3677. Simplify generation stamp upgrade by making is a local upgrade on datandodes. Deleted distributed upgrade. (rangadi) - + HADOOP-2928. Remove deprecated FileSystem.getContentLength(). (Lohit Vijayarenu via rangadi) HADOOP-3130. Make the connect timeout smaller for getFile. (Amar Ramesh Kamat via ddas) - HADOOP-3160. Remove deprecated exists() from ClientProtocol and + HADOOP-3160. Remove deprecated exists() from ClientProtocol and FSNamesystem (Lohit Vjayarenu via rangadi) HADOOP-2910. Throttle IPC Clients during bursts of requests or @@ -10240,10 +10237,10 @@ Release 0.18.0 - 2008-08-19 HADOOP-3398. Minor improvement to a utility function in that participates in backoff calculation. (cdouglas) - HADOOP-3381. Clear referenced when directories are deleted so that + HADOOP-3381. Clear referenced when directories are deleted so that effect of memory leaks are not multiplied. (rangadi) - HADOOP-2867. Adds the task's CWD to its LD_LIBRARY_PATH. + HADOOP-2867. Adds the task's CWD to its LD_LIBRARY_PATH. (Amareshwari Sriramadasu via ddas) HADOOP-3232. DU class runs the 'du' command in a seperate thread so @@ -10272,12 +10269,12 @@ Release 0.18.0 - 2008-08-19 rather than SequenceFiles and compression of map-outputs is now implemented by compressing the entire file rather than SequenceFile compression. Shuffle also has been changed to use a simple byte-buffer - manager rather than the InMemoryFileSystem. + manager rather than the InMemoryFileSystem. Configuration changes to hadoop-default.xml: - deprecated mapred.map.output.compression.type + deprecated mapred.map.output.compression.type (acmurthy) - HADOOP-236. 
JobTacker now refuses connection from a task tracker with a + HADOOP-236. JobTacker now refuses connection from a task tracker with a different version number. (Sharad Agarwal via ddas) HADOOP-3427. Improves the shuffle scheduler. It now waits for notifications @@ -10290,10 +10287,10 @@ Release 0.18.0 - 2008-08-19 HADOOP-3501. Deprecate InMemoryFileSystem. (cutting via omalley) HADOOP-3366. Stall the shuffle while in-memory merge is in progress. - (acmurthy) + (acmurthy) HADOOP-2916. Refactor src structure, but leave package structure alone. - (Raghu Angadi via mukund) + (Raghu Angadi via mukund) HADOOP-3492. Add forrest documentation for user archives. (Mahadev Konar via hairong) @@ -10304,7 +10301,7 @@ Release 0.18.0 - 2008-08-19 HADOOP-3379. Documents stream.non.zero.exit.status.is.failure for Streaming. (Amareshwari Sriramadasu via ddas) - HADOOP-3096. Improves documentation about the Task Execution Environment in + HADOOP-3096. Improves documentation about the Task Execution Environment in the Map-Reduce tutorial. (Amareshwari Sriramadasu via ddas) HADOOP-2984. Add forrest documentation for DistCp. (cdouglas) @@ -10312,7 +10309,7 @@ Release 0.18.0 - 2008-08-19 HADOOP-3406. Add forrest documentation for Profiling. (Amareshwari Sriramadasu via ddas) - HADOOP-2762. Add forrest documentation for controls of memory limits on + HADOOP-2762. Add forrest documentation for controls of memory limits on hadoop daemons and Map-Reduce tasks. (Amareshwari Sriramadasu via ddas) HADOOP-3535. Fix documentation and name of IOUtils.close to @@ -10323,7 +10320,7 @@ Release 0.18.0 - 2008-08-19 HADOOP-3547. Documents the way in which native libraries can be distributed via the DistributedCache. (Amareshwari Sriramadasu via ddas) - HADOOP-3606. Updates the Streaming doc. (Amareshwari Sriramadasu via ddas) + HADOOP-3606. Updates the Streaming doc. (Amareshwari Sriramadasu via ddas) HADOOP-3532. Add jdiff reports to the build scripts. 
(omalley) @@ -10333,7 +10330,7 @@ Release 0.18.0 - 2008-08-19 OPTIMIZATIONS - HADOOP-3274. The default constructor of BytesWritable creates empty + HADOOP-3274. The default constructor of BytesWritable creates empty byte array. (Tsz Wo (Nicholas), SZE via shv) HADOOP-3272. Remove redundant copy of Block object in BlocksMap. @@ -10352,7 +10349,7 @@ Release 0.18.0 - 2008-08-19 HADOOP-3369. Fast block processing during name-node startup. (shv) - HADOOP-1702. Reduce buffer copies when data is written to DFS. + HADOOP-1702. Reduce buffer copies when data is written to DFS. DataNodes take 30% less CPU while writing data. (rangadi) HADOOP-3095. Speed up split generation in the FileInputSplit, @@ -10364,16 +10361,16 @@ Release 0.18.0 - 2008-08-19 BUG FIXES - HADOOP-2905. 'fsck -move' triggers NPE in NameNode. + HADOOP-2905. 'fsck -move' triggers NPE in NameNode. (Lohit Vjayarenu via rangadi) Increment ClientProtocol.versionID missed by HADOOP-2585. (shv) HADOOP-3254. Restructure internal namenode methods that process - heartbeats to use well-defined BlockCommand object(s) instead of + heartbeats to use well-defined BlockCommand object(s) instead of using the base java Object. (Tsz Wo (Nicholas), SZE via dhruba) - HADOOP-3176. Change lease record when a open-for-write-file + HADOOP-3176. Change lease record when a open-for-write-file gets renamed. (dhruba) HADOOP-3269. Fix a case when namenode fails to restart @@ -10391,7 +10388,7 @@ Release 0.18.0 - 2008-08-19 (tomwhite via omalley) HADOOP-3270. Constant DatanodeCommands are stored in static final - immutable variables for better code clarity. + immutable variables for better code clarity. (Tsz Wo (Nicholas), SZE via dhruba) HADOOP-2793. Fix broken links for worst performing shuffle tasks in @@ -10410,7 +10407,7 @@ Release 0.18.0 - 2008-08-19 committed. Updated all references to use the new JobID representation. (taton via nigel) - HADOOP-3337. Loading FSEditLog was broken by HADOOP-3283 since it + HADOOP-3337. 
Loading FSEditLog was broken by HADOOP-3283 since it changed Writable serialization of DatanodeInfo. This patch handles it. (Tsz Wo (Nicholas), SZE via rangadi) @@ -10464,10 +10461,10 @@ Release 0.18.0 - 2008-08-19 HADOOP-3399. A debug message was logged at info level. (rangadi) - HADOOP-3396. TestDatanodeBlockScanner occationally fails. + HADOOP-3396. TestDatanodeBlockScanner occationally fails. (Lohit Vijayarenu via rangadi) - HADOOP-3339. Some of the failures on 3rd datanode in DFS write pipelie + HADOOP-3339. Some of the failures on 3rd datanode in DFS write pipelie are not detected properly. This could lead to hard failure of client's write operation. (rangadi) @@ -10477,7 +10474,7 @@ Release 0.18.0 - 2008-08-19 hierarchy. This also adds a new counter to track cache hits at levels greater than two. (Amar Kamat via cdouglas) - HADOOP-3375. Lease paths were sometimes not removed from + HADOOP-3375. Lease paths were sometimes not removed from LeaseManager.sortedLeasesByPath. (Tsz Wo (Nicholas), SZE via dhruba) HADOOP-3424. Values returned by getPartition should be checked to @@ -10511,7 +10508,7 @@ Release 0.18.0 - 2008-08-19 "mapred.work.output.dir" property to work post-3041. (cdouglas via omalley) HADOOP-2669. DFSClient locks pendingCreates appropriately. (dhruba) - + HADOOP-3410. Fix KFS implemenation to return correct file modification time. (Sriram Rao via cutting) @@ -10537,16 +10534,16 @@ Release 0.18.0 - 2008-08-19 org.apache.hadoop.mapred.JobShell. (Amareshwari Sriramadasu via ddas) - HADOOP-2132. Only RUNNING/PREP jobs can be killed. (Jothi Padmanabhan + HADOOP-2132. Only RUNNING/PREP jobs can be killed. (Jothi Padmanabhan via ddas) HADOOP-3476. Code cleanup in fuse-dfs. (Peter Wyckoff via dhruba) HADOOP-2427. Ensure that the cwd of completed tasks is cleaned-up - correctly on task-completion. (Amareshwari Sri Ramadasu via acmurthy) + correctly on task-completion. (Amareshwari Sri Ramadasu via acmurthy) - HADOOP-2565. 
Remove DFSPath cache of FileStatus. + HADOOP-2565. Remove DFSPath cache of FileStatus. (Tsz Wo (Nicholas), SZE via hairong) HADOOP-3326. Cleanup the local-fs and in-memory merge in the ReduceTask by @@ -10554,7 +10551,7 @@ Release 0.18.0 - 2008-08-19 (Sharad Agarwal via acmurthy) HADOOP-3493. Fix TestStreamingFailure to use FileUtil.fullyDelete to - ensure correct cleanup. (Lohit Vijayarenu via acmurthy) + ensure correct cleanup. (Lohit Vijayarenu via acmurthy) HADOOP-3455. Fix NPE in ipc.Client in case of connection failure and improve its synchronization. (hairong) @@ -10573,17 +10570,17 @@ Release 0.18.0 - 2008-08-19 (Nicholas), SZE) HADOOP-3440. Fixes DistributedCache to not create symlinks for paths which - don't have fragments even when createSymLink is true. - (Abhijit Bagri via ddas) + don't have fragments even when createSymLink is true. + (Abhijit Bagri via ddas) HADOOP-3463. Hadoop-daemons script should cd to $HADOOP_HOME. (omalley) HADOOP-3489. Fix NPE in SafeModeMonitor. (Lohit Vijayarenu via shv) - HADOOP-3509. Fix NPE in FSNamesystem.close. (Tsz Wo (Nicholas), SZE via + HADOOP-3509. Fix NPE in FSNamesystem.close. (Tsz Wo (Nicholas), SZE via shv) - HADOOP-3491. Name-node shutdown causes InterruptedException in + HADOOP-3491. Name-node shutdown causes InterruptedException in ResolutionMonitor. (Lohit Vijayarenu via shv) HADOOP-3511. Fixes namenode image to not set the root's quota to an @@ -10595,7 +10592,7 @@ Release 0.18.0 - 2008-08-19 HADOOP-3513. Improve NNThroughputBenchmark log messages. (shv) HADOOP-3519. Fix NPE in DFS FileSystem rename. (hairong via tomwhite) - + HADOOP-3528. Metrics FilesCreated and files_deleted metrics do not match. (Lohit via Mahadev) @@ -10640,12 +10637,12 @@ Release 0.18.0 - 2008-08-19 HADOOP-3533. Add deprecated methods to provide API compatibility between 0.18 and 0.17. Remove the deprecated methods in trunk. (omalley) - HADOOP-3580. Fixes a problem to do with specifying a har as an input to + HADOOP-3580. 
Fixes a problem to do with specifying a har as an input to a job. (Mahadev Konar via ddas) - HADOOP-3333. Don't assign a task to a tasktracker that it failed to + HADOOP-3333. Don't assign a task to a tasktracker that it failed to execute earlier (used to happen in the case of lost tasktrackers where - the tasktracker would reinitialize and bind to a different port). + the tasktracker would reinitialize and bind to a different port). (Jothi Padmanabhan and Arun Murthy via ddas) HADOOP-3534. Log IOExceptions that happen in closing the name @@ -10666,7 +10663,7 @@ Release 0.18.0 - 2008-08-19 HADOOP-3599. Fix JobConf::setCombineOnceOnly to modify the instance rather than a parameter. (Owen O'Malley via cdouglas) - HADOOP-3590. Null pointer exception in JobTracker when the task tracker is + HADOOP-3590. Null pointer exception in JobTracker when the task tracker is not yet resolved. (Amar Ramesh Kamat via ddas) HADOOP-3603. Fix MapOutputCollector to spill when io.sort.spill.percent is @@ -10680,7 +10677,7 @@ Release 0.18.0 - 2008-08-19 HADOOP-3480. Need to update Eclipse template to reflect current trunk. (Brice Arnould via tomwhite) - + HADOOP-3588. Fixed usability issues with archives. (mahadev) HADOOP-3635. Uncaught exception in DataBlockScanner. @@ -10711,7 +10708,7 @@ Release 0.18.0 - 2008-08-19 HADOOP-3653. Fix test-patch target to properly account for Eclipse classpath jars. (Brice Arnould via nigel) - HADOOP-3692. Fix documentation for Cluster setup and Quick start guides. + HADOOP-3692. Fix documentation for Cluster setup and Quick start guides. (Amareshwari Sriramadasu via ddas) HADOOP-3691. Fix streaming and tutorial docs. (Jothi Padmanabhan via ddas) @@ -10727,7 +10724,7 @@ Release 0.18.0 - 2008-08-19 an int, per the OutputStream contract. (Sriram Rao via cdouglas) HADOOP-3647. Add debug logs to help track down a very occassional, - hard-to-reproduce, bug in shuffle/merge on the reducer. (acmurthy) + hard-to-reproduce, bug in shuffle/merge on the reducer. 
(acmurthy) HADOOP-3716. Prevent listStatus in KosmosFileSystem from returning null for valid, empty directories. (Sriram Rao via cdouglas) @@ -10737,12 +10734,12 @@ Release 0.18.0 - 2008-08-19 HADOOP-3737. Fix CompressedWritable to call Deflater::end to release compressor memory. (Grant Glouser via cdouglas) - HADOOP-3670. Fixes JobTracker to clear out split bytes when no longer + HADOOP-3670. Fixes JobTracker to clear out split bytes when no longer required. (Amareshwari Sriramadasu via ddas) HADOOP-3755. Update gridmix to work with HOD 0.4 (Runping Qi via cdouglas) - - HADOOP-3743. Fix -libjars, -files, -archives options to work even if + + HADOOP-3743. Fix -libjars, -files, -archives options to work even if user code does not implement tools. (Amareshwari Sriramadasu via mahadev) HADOOP-3774. Fix typos in shell output. (Tsz Wo (Nicholas), SZE via @@ -10770,15 +10767,15 @@ Release 0.18.0 - 2008-08-19 metric_avg_time. (Lohit Vijayarenu via hairong) HADOOP-3521. Reverted the missing cast to float for sending Counters' values - to Hadoop metrics which was removed by HADOOP-544. (acmurthy) + to Hadoop metrics which was removed by HADOOP-544. (acmurthy) - HADOOP-3820. Fixes two problems in the gridmix-env - a syntax error, and a + HADOOP-3820. Fixes two problems in the gridmix-env - a syntax error, and a wrong definition of USE_REAL_DATASET by default. (Arun Murthy via ddas) HADOOP-3724. Fixes two problems related to storing and recovering lease in the fsimage. (dhruba) - - HADOOP-3827. Fixed compression of empty map-outputs. (acmurthy) + + HADOOP-3827. Fixed compression of empty map-outputs. (acmurthy) HADOOP-3865. Remove reference to FSNamesystem from metrics preventing garbage collection. (Lohit Vijayarenu via cdouglas) @@ -10788,20 +10785,20 @@ Release 0.18.0 - 2008-08-19 HADOOP-3837. Streaming jobs report progress status. (dhruba) - HADOOP-3897. Fix a NPE in secondary namenode. (Lohit Vijayarenu via + HADOOP-3897. Fix a NPE in secondary namenode. 
(Lohit Vijayarenu via cdouglas) HADOOP-3901. Fix bin/hadoop to correctly set classpath under cygwin. (Tsz Wo (Nicholas) Sze via omalley) - HADOOP-3947. Fix a problem in tasktracker reinitialization. + HADOOP-3947. Fix a problem in tasktracker reinitialization. (Amareshwari Sriramadasu via ddas) Release 0.17.3 - Unreleased IMPROVEMENTS - HADOOP-4164. Chinese translation of the documentation. (Xuebing Yan via + HADOOP-4164. Chinese translation of the documentation. (Xuebing Yan via omalley) BUG FIXES @@ -10809,7 +10806,7 @@ Release 0.17.3 - Unreleased HADOOP-4277. Checksum verification was mistakenly disabled for LocalFileSystem. (Raghu Angadi) - HADOOP-4271. Checksum input stream can sometimes return invalid + HADOOP-4271. Checksum input stream can sometimes return invalid data to the user. (Ning Li via rangadi) HADOOP-4318. DistCp should use absolute paths for cleanup. (szetszwo) @@ -10846,16 +10843,16 @@ Release 0.17.2 - 2008-08-11 the number of xceiver threads in a data-node. (shv) HADOOP-3370. Ensure that the TaskTracker.runningJobs data-structure is - correctly cleaned-up on task completion. (Zheng Shao via acmurthy) + correctly cleaned-up on task completion. (Zheng Shao via acmurthy) - HADOOP-3813. Fix task-output clean-up on HDFS to use the recursive + HADOOP-3813. Fix task-output clean-up on HDFS to use the recursive FileSystem.delete rather than the FileUtil.fullyDelete. (Amareshwari - Sri Ramadasu via acmurthy) + Sri Ramadasu via acmurthy) HADOOP-3859. Allow the maximum number of xceivers in the data node to be configurable. (Johan Oskarsson via omalley) - HADOOP-3931. Fix corner case in the map-side sort that causes some values + HADOOP-3931. Fix corner case in the map-side sort that causes some values to be counted as too large and cause pre-mature spills to disk. Some values will also bypass the combiner incorrectly. (cdouglas via omalley) @@ -10908,7 +10905,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-2786. Move hbase out of hadoop core - HADOOP-2345. 
New HDFS transactions to support appending + HADOOP-2345. New HDFS transactions to support appending to files. Disk layout version changed from -11 to -12. (dhruba) HADOOP-2192. Error messages from "dfs mv" command improved. @@ -10921,7 +10918,7 @@ Release 0.17.0 - 2008-05-18 Disk layout version changed from -12 to -13. See changelist 630992 (dhruba) - HADOOP-1985. This addresses rack-awareness for Map tasks and for + HADOOP-1985. This addresses rack-awareness for Map tasks and for HDFS in a uniform way. (ddas) HADOOP-1986. Add support for a general serialization mechanism for @@ -10935,10 +10932,10 @@ Release 0.17.0 - 2008-05-18 and isDir(String) from ClientProtocol. ClientProtocol version changed from 26 to 27. (Tsz Wo (Nicholas), SZE via cdouglas) - HADOOP-2822. Remove deprecated code for classes InputFormatBase and + HADOOP-2822. Remove deprecated code for classes InputFormatBase and PhasedFileSystem. (Amareshwari Sriramadasu via enis) - HADOOP-2116. Changes the layout of the task execution directory. + HADOOP-2116. Changes the layout of the task execution directory. (Amareshwari Sriramadasu via ddas) HADOOP-2828. The following deprecated methods in Configuration.java @@ -10954,7 +10951,7 @@ Release 0.17.0 - 2008-05-18 (Amareshwari Sriramadasu via ddas) HADOOP-2823. Removes deprecated methods getColumn(), getLine() from - org.apache.hadoop.record.compiler.generated.SimpleCharStream. + org.apache.hadoop.record.compiler.generated.SimpleCharStream. (Amareshwari Sriramadasu via ddas) HADOOP-3060. Removes one unused constructor argument from MiniMRCluster. @@ -10990,7 +10987,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-3239. getFileInfo() returns null for non-existing files instead of throwing FileNotFoundException. (Lohit Vijayarenu via shv) - HADOOP-3266. Removed HOD changes from CHANGES.txt, as they are now inside + HADOOP-3266. Removed HOD changes from CHANGES.txt, as they are now inside src/contrib/hod (Hemanth Yamijala via ddas) HADOOP-3280. 
Separate the configuration of the virtual memory size @@ -11004,7 +11001,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-2178. Job History on DFS. (Amareshwari Sri Ramadasu via ddas) - HADOOP-2063. A new parameter to dfs -get command to fetch a file + HADOOP-2063. A new parameter to dfs -get command to fetch a file even if it is corrupted. (Tsz Wo (Nicholas), SZE via dhruba) HADOOP-2219. A new command "df -count" that counts the number of @@ -11016,7 +11013,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-2346. Utilities to support timeout while writing to sockets. DFSClient and DataNode sockets have 10min write timeout. (rangadi) - + HADOOP-2951. Add a contrib module that provides a utility to build or update Lucene indexes using Map/Reduce. (Ning Li via cutting) @@ -11032,14 +11029,14 @@ Release 0.17.0 - 2008-05-18 HADOOP-3001. Add job counters that measure the number of bytes read and written to HDFS, S3, KFS, and local file systems. (omalley) - HADOOP-3048. A new Interface and a default implementation to convert + HADOOP-3048. A new Interface and a default implementation to convert and restore serializations of objects to/from strings. (enis) IMPROVEMENTS - HADOOP-2655. Copy on write for data and metadata files in the + HADOOP-2655. Copy on write for data and metadata files in the presence of snapshots. Needed for supporting appends to HDFS - files. (dhruba) + files. (dhruba) HADOOP-1967. When a Path specifies the same scheme as the default FileSystem but no authority, the default FileSystem's authority is @@ -11050,7 +11047,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-2895. Let the profiling string be configurable. (Martin Traverso via cdouglas) - HADOOP-910. Enables Reduces to do merges for the on-disk map output files + HADOOP-910. Enables Reduces to do merges for the on-disk map output files in parallel with their copying. (Amar Kamat via ddas) HADOOP-730. Use rename rather than copy for local renames. (cdouglas) @@ -11065,7 +11062,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-2888. 
Make gridmix scripts more readily configurable and amenable to automated execution. (Mukund Madhugiri via cdouglas) - HADOOP-2908. A document that describes the DFS Shell command. + HADOOP-2908. A document that describes the DFS Shell command. (Mahadev Konar via dhruba) HADOOP-2981. Update README.txt to reflect the upcoming use of @@ -11078,7 +11075,7 @@ Release 0.17.0 - 2008-05-18 locally, the second off-rack, and the third intra-rack from the second. (lohit vijayarenu via cdouglas) - HADOOP-2939. Make the automated patch testing process an executable + HADOOP-2939. Make the automated patch testing process an executable Ant target, test-patch. (nigel) HADOOP-2239. Add HsftpFileSystem to permit transferring files over ssl. @@ -11117,7 +11114,7 @@ Release 0.17.0 - 2008-05-18 (Nigel Daley via cdouglas) HADOOP-3174. Illustrative example for MultipleFileInputFormat. (Enis - Soztutar via acmurthy) + Soztutar via acmurthy) HADOOP-2993. Clarify the usage of JAVA_HOME in the Quick Start guide. (acmurthy via nigel) @@ -11134,26 +11131,26 @@ Release 0.17.0 - 2008-05-18 HDFS, without negatively affecting read throughput. (rangadi) HADOOP-2399. Input key and value to combiner and reducer is reused. - (Owen O'Malley via ddas). + (Owen O'Malley via ddas). HADOOP-2423. Code optimization in FSNamesystem.mkdirs. (Tsz Wo (Nicholas), SZE via dhruba) HADOOP-2606. ReplicationMonitor selects data-nodes to replicate directly - from needed replication blocks instead of looking up for the blocks for + from needed replication blocks instead of looking up for the blocks for each live data-node. (shv) HADOOP-2148. Eliminate redundant data-node blockMap lookups. (shv) HADOOP-2027. Return the number of bytes in each block in a file - via a single rpc to the namenode to speed up job planning. + via a single rpc to the namenode to speed up job planning. (Lohit Vijaya Renu via omalley) HADOOP-2902. Replace uses of "fs.default.name" with calls to the accessor methods added in HADOOP-1967. 
(cutting) HADOOP-2119. Optimize scheduling of jobs with large numbers of - tasks by replacing static arrays with lists of runnable tasks. + tasks by replacing static arrays with lists of runnable tasks. (Amar Kamat via omalley) HADOOP-2919. Reduce the number of memory copies done during the @@ -11170,18 +11167,18 @@ Release 0.17.0 - 2008-05-18 HADOOP-3168. Reduce the amount of logging in streaming to an exponentially increasing number of records (up to 10,000 records/log). (Zheng Shao via omalley) - + BUG FIXES HADOOP-2195. '-mkdir' behaviour is now closer to Linux shell in case of errors. (Mahadev Konar via rangadi) - - HADOOP-2190. bring behaviour '-ls' and '-du' closer to Linux shell + + HADOOP-2190. bring behaviour '-ls' and '-du' closer to Linux shell commands in case of errors. (Mahadev Konar via rangadi) - + HADOOP-2193. 'fs -rm' and 'fs -rmr' show error message when the target file does not exist. (Mahadev Konar via rangadi) - + HADOOP-2738 Text is not subclassable because set(Text) and compareTo(Object) access the other instance's private members directly. (jimk) @@ -11190,13 +11187,13 @@ Release 0.17.0 - 2008-05-18 HADOOP-2194. dfs cat on a non-existent file throws FileNotFoundException. (Mahadev Konar via dhruba) - HADOOP-2767. Fix for NetworkTopology erroneously skipping the last leaf + HADOOP-2767. Fix for NetworkTopology erroneously skipping the last leaf node on a rack. (Hairong Kuang and Mark Butler via dhruba) HADOOP-1593. FsShell works with paths in non-default FileSystem. (Mahadev Konar via dhruba) - HADOOP-2191. du and dus command on non-existent directory gives + HADOOP-2191. du and dus command on non-existent directory gives appropriate error message. (Mahadev Konar via dhruba) HADOOP-2832. Remove tabs from code of DFSClient for better @@ -11222,7 +11219,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-2912. MiniDFSCluster restart should wait for namenode to exit safemode. This was causing TestFsck to fail. (Mahadev Konar via dhruba) - HADOOP-2820. 
The following classes in streaming are removed : + HADOOP-2820. The following classes in streaming are removed : StreamLineRecordReader StreamOutputFormat StreamSequenceRecordReader. (Amareshwari Sri Ramadasu via ddas) @@ -11231,11 +11228,11 @@ Release 0.17.0 - 2008-05-18 setInputValueClass(Class theClass) setSpeculativeExecution getSpeculativeExecution() (Amareshwari Sri Ramadasu via ddas) - HADOOP-2817. Removes deprecated mapred.tasktracker.tasks.maximum and - ClusterStatus.getMaxTasks(). (Amareshwari Sri Ramadasu via ddas) + HADOOP-2817. Removes deprecated mapred.tasktracker.tasks.maximum and + ClusterStatus.getMaxTasks(). (Amareshwari Sri Ramadasu via ddas) HADOOP-2821. Removes deprecated ShellUtil and ToolBase classes from - the util package. (Amareshwari Sri Ramadasu via ddas) + the util package. (Amareshwari Sri Ramadasu via ddas) HADOOP-2934. The namenode was encountreing a NPE while loading leases from the fsimage. Fixed. (dhruba) @@ -11252,7 +11249,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-2973. Fix TestLocalDFS for Windows platform. (Tsz Wo (Nicholas), SZE via dhruba) - HADOOP-2971. select multiple times if it returns early in + HADOOP-2971. select multiple times if it returns early in SocketIOWithTimeout. (rangadi) HADOOP-2955. Fix TestCrcCorruption test failures caused by HADOOP-2758 @@ -11267,13 +11264,13 @@ Release 0.17.0 - 2008-05-18 HADOOP-2996. Fixes uses of StringBuffer in StreamUtils class. (Dave Brosius via ddas) - HADOOP-2995. Fixes StreamBaseRecordReader's getProgress to return a + HADOOP-2995. Fixes StreamBaseRecordReader's getProgress to return a floating point number. (Dave Brosius via ddas) HADOOP-2972. Fix for a NPE in FSDataset.invalidate. (Mahadev Konar via dhruba) - HADOOP-2994. Code cleanup for DFSClient: remove redundant + HADOOP-2994. Code cleanup for DFSClient: remove redundant conversions from string to string. (Dave Brosius via dhruba) HADOOP-3009. 
TestFileCreation sometimes fails because restarting @@ -11285,7 +11282,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-2679. Fix a typo in libhdfs. (Jason via dhruba) - HADOOP-2976. When a lease expires, the Namenode ensures that + HADOOP-2976. When a lease expires, the Namenode ensures that blocks of the file are adequately replicated. (dhruba) HADOOP-2901. Fixes the creation of info servers in the JobClient @@ -11307,11 +11304,11 @@ Release 0.17.0 - 2008-05-18 HADOOP-3008. SocketIOWithTimeout throws InterruptedIOException if the thread is interrupted while it is waiting. (rangadi) - + HADOOP-3006. Fix wrong packet size reported by DataNode when a block is being replicated. (rangadi) - HADOOP-3029. Datanode prints log message "firstbadlink" only if + HADOOP-3029. Datanode prints log message "firstbadlink" only if it detects a bad connection to another datanode in the pipeline. (dhruba) HADOOP-3030. Release reserved space for file in InMemoryFileSystem if @@ -11320,20 +11317,20 @@ Release 0.17.0 - 2008-05-18 HADOOP-3036. Fix findbugs warnings in UpgradeUtilities. (Konstantin Shvachko via cdouglas) - HADOOP-3025. ChecksumFileSystem supports the delete method with + HADOOP-3025. ChecksumFileSystem supports the delete method with the recursive flag. (Mahadev Konar via dhruba) - HADOOP-3012. dfs -mv file to user home directory throws exception if + HADOOP-3012. dfs -mv file to user home directory throws exception if the user home directory does not exist. (Mahadev Konar via dhruba) - + HADOOP-3066. Should not require superuser privilege to query if hdfs is in safe mode (jimk) HADOOP-3040. If the input line starts with the separator char, the key - is set as empty. (Amareshwari Sriramadasu via ddas) + is set as empty. (Amareshwari Sriramadasu via ddas) HADOOP-3080. Removes flush calls from JobHistory. - (Amareshwari Sriramadasu via ddas) + (Amareshwari Sriramadasu via ddas) HADOOP-3086. Adds the testcase missed during commit of hadoop-3040. 
(Amareshwari Sriramadasu via ddas) @@ -11359,12 +11356,12 @@ Release 0.17.0 - 2008-05-18 HADOOP-3064. Commas in a file path should not be treated as delimiters. (Hairong Kuang via shv) - HADOOP-2997. Adds test for non-writable serialier. Also fixes a problem + HADOOP-2997. Adds test for non-writable serialier. Also fixes a problem introduced by HADOOP-2399. (Tom White via ddas) HADOOP-3114. Fix TestDFSShell on Windows. (Lohit Vijaya Renu via cdouglas) - HADOOP-3118. Fix Namenode NPE while loading fsimage after a cluster + HADOOP-3118. Fix Namenode NPE while loading fsimage after a cluster upgrade from older disk format. (dhruba) HADOOP-3161. Fix FIleUtil.HardLink.getLinkCount on Mac OS. (nigel @@ -11411,7 +11408,7 @@ Release 0.17.0 - 2008-05-18 block are bad (cdouglas) HADOOP-3157. Fix path handling in DistributedCache and TestMiniMRLocalFS. - (Doug Cutting via rangadi) + (Doug Cutting via rangadi) HADOOP-3018. Fix the eclipse plug-in contrib wrt removed deprecated methods (taton) @@ -11451,7 +11448,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-3242. Fix the RecordReader of SequenceFileAsBinaryInputFormat to correctly read from the start of the split and not the beginning of the - file. (cdouglas via acmurthy) + file. (cdouglas via acmurthy) HADOOP-3256. Encodes the job name used in the filename for history files. (Arun Murthy via ddas) @@ -11462,7 +11459,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-3263. Ensure that the job-history log file always follows the pattern of hostname_timestamp_jobid_username_jobname even if username and/or jobname are not specfied. This helps to avoid wrong assumptions - made about the job-history log filename in jobhistory.jsp. (acmurthy) + made about the job-history log filename in jobhistory.jsp. (acmurthy) HADOOP-3251. Fixes getFilesystemName in JobTracker and LocalJobRunner to use FileSystem.getUri instead of FileSystem.getName. (Arun Murthy via ddas) @@ -11470,7 +11467,7 @@ Release 0.17.0 - 2008-05-18 HADOOP-3237. 
Fixes TestDFSShell.testErrOutPut on Windows platform. (Mahadev Konar via ddas) - HADOOP-3279. TaskTracker checks for SUCCEEDED task status in addition to + HADOOP-3279. TaskTracker checks for SUCCEEDED task status in addition to COMMIT_PENDING status when it fails maps due to lost map. (Devaraj Das) @@ -11528,7 +11525,7 @@ Release 0.16.3 - 2008-04-16 HADOOP-3182. Change permissions of the job-submission directory to 777 from 733 to ensure sharing of HOD clusters works correctly. (Tsz Wo - (Nicholas), Sze and Amareshwari Sri Ramadasu via acmurthy) + (Nicholas), Sze and Amareshwari Sri Ramadasu via acmurthy) Release 0.16.2 - 2008-04-02 @@ -11537,7 +11534,7 @@ Release 0.16.2 - 2008-04-02 HADOOP-3011. Prohibit distcp from overwriting directories on the destination filesystem with files. (cdouglas) - HADOOP-3033. The BlockReceiver thread in the datanode writes data to + HADOOP-3033. The BlockReceiver thread in the datanode writes data to the block file, changes file position (if needed) and flushes all by itself. The PacketResponder thread does not flush block file. (dhruba) @@ -11548,10 +11545,10 @@ Release 0.16.2 - 2008-04-02 Also makes the _temporary a constant in MRConstants.java. (Amareshwari Sriramadasu via ddas) - HADOOP-3003. FileSystem cache key is updated after a + HADOOP-3003. FileSystem cache key is updated after a FileSystem object is created. (Tsz Wo (Nicholas), SZE via dhruba) - HADOOP-3042. Updates the Javadoc in JobConf.getOutputPath to reflect + HADOOP-3042. Updates the Javadoc in JobConf.getOutputPath to reflect the actual temporary path. (Amareshwari Sriramadasu via ddas) HADOOP-3007. Tolerate mirror failures while DataNode is replicating @@ -11570,7 +11567,7 @@ Release 0.16.2 - 2008-04-02 FileSystem. (Amareshwari Sriramadasu via ddas) HADOOP-3056. Fix distcp when the target is an empty directory by - making sure the directory is created first. (cdouglas and acmurthy + making sure the directory is created first. 
(cdouglas and acmurthy via omalley) HADOOP-3070. Protect the trash emptier thread from null pointer @@ -11585,10 +11582,10 @@ Release 0.16.2 - 2008-04-02 between the RecordReader and the map threads. (Alejandro Abdelnur via omalley) - HADOOP-2833. Do not use "Dr. Who" as the default user in JobClient. + HADOOP-2833. Do not use "Dr. Who" as the default user in JobClient. A valid user name is required. (Tsz Wo (Nicholas), SZE via rangadi) - HADOOP-3128. Throw RemoteException in setPermissions and setOwner of + HADOOP-3128. Throw RemoteException in setPermissions and setOwner of DistributedFileSystem. (shv via nigel) Release 0.16.1 - 2008-03-13 @@ -11608,17 +11605,17 @@ Release 0.16.1 - 2008-03-13 HADOOP-3098. Allow more characters in user and group names while using -chown and -chgrp commands. (rangadi) - + BUG FIXES HADOOP-2789. Race condition in IPC Server Responder that could close connections early. (Raghu Angadi) - - HADOOP-2785. minor. Fix a typo in Datanode block verification + + HADOOP-2785. minor. Fix a typo in Datanode block verification (Raghu Angadi) - + HADOOP-2788. minor. Fix help message for chgrp shell command (Raghu Angadi). - + HADOOP-1188. fstime file is updated when a storage directory containing namespace image becomes inaccessible. (shv) @@ -11657,7 +11654,7 @@ Release 0.16.1 - 2008-03-13 HADOOP-2811. Dump of counters in job history does not add comma between groups. (runping via omalley) - HADOOP-2735. Enables setting TMPDIR for tasks. + HADOOP-2735. Enables setting TMPDIR for tasks. (Amareshwari Sri Ramadasu via ddas) HADOOP-2843. Fix protections on map-side join classes to enable derivation. @@ -11678,7 +11675,7 @@ Release 0.16.1 - 2008-03-13 HADOOP-2903. Fix exception generated by Metrics while using pushMetric(). (girish vaitheeswaran via dhruba) - HADOOP-2904. Fix to RPC metrics to log the correct host name. + HADOOP-2904. Fix to RPC metrics to log the correct host name. (girish vaitheeswaran via dhruba) HADOOP-2918. 
Improve error logging so that dfs writes failure with @@ -11695,19 +11692,19 @@ Release 0.16.1 - 2008-03-13 datnodes flushes the block file buffered output stream before sending a positive ack for the packet back to the client. (dhruba) - HADOOP-2756. NPE in DFSClient while closing DFSOutputStreams + HADOOP-2756. NPE in DFSClient while closing DFSOutputStreams under load. (rangadi) HADOOP-2958. Fixed FileBench which broke due to HADOOP-2391 which performs a check for existence of the output directory and a trivial bug in GenericMRLoadGenerator where min/max word lenghts were identical since they were looking at the same config variables (Chris Douglas via - acmurthy) + acmurthy) HADOOP-2915. Fixed FileSystem.CACHE so that a username is included in the cache key. (Tsz Wo (Nicholas), SZE via nigel) - HADOOP-2813. TestDU unit test uses its own directory to run its + HADOOP-2813. TestDU unit test uses its own directory to run its sequence of tests. (Mahadev Konar via dhruba) Release 0.16.0 - 2008-02-07 @@ -11719,11 +11716,11 @@ Release 0.16.0 - 2008-02-07 the value configured on the jobtracker. InterTrackerProtocol version changed from 5 to 6. (Michael Bieniosek via omalley) - HADOOP-1843. Removed code from Configuration and JobConf deprecated by - HADOOP-785 and a minor fix to Configuration.toString. Specifically the - important change is that mapred-default.xml is no longer supported and + HADOOP-1843. Removed code from Configuration and JobConf deprecated by + HADOOP-785 and a minor fix to Configuration.toString. Specifically the + important change is that mapred-default.xml is no longer supported and Configuration no longer supports the notion of default/final resources. - (acmurthy) + (acmurthy) HADOOP-1302. Remove deprecated abacus code from the contrib directory. This also fixes a configuration bug in AggregateWordCount, so that the @@ -11738,7 +11735,7 @@ Release 0.16.0 - 2008-02-07 HADOOP-2185. RPC Server uses any available port if the specified port is zero. 
Otherwise it uses the specified port. Also combines the configuration attributes for the servers' bind address and - port from "x.x.x.x" and "y" to "x.x.x.x:y". + port from "x.x.x.x" and "y" to "x.x.x.x:y". Deprecated configuration variables: dfs.info.bindAddress dfs.info.port @@ -11771,9 +11768,9 @@ Release 0.16.0 - 2008-02-07 Protocol version changed from 21 to 22. (Raghu Angadi via dhruba) HADOOP-2110. Block report processing creates fewer transient objects. - Datanode Protocol version changed from 10 to 11. + Datanode Protocol version changed from 10 to 11. (Sanjay Radia via dhruba) - + HADOOP-2567. Add FileSystem#getHomeDirectory(), which returns the user's home directory in a FileSystem as a fully-qualified path. FileSystem#getWorkingDirectory() is also changed to return a @@ -11793,9 +11790,9 @@ Release 0.16.0 - 2008-02-07 writes to a HDFS file. Changed Data Transfer Version from 7 to 8. (dhruba) - HADOOP-2652. Fix permission issues for HftpFileSystem. This is an - incompatible change since distcp may not be able to copy files - from cluster A (compiled with this patch) to cluster B (compiled + HADOOP-2652. Fix permission issues for HftpFileSystem. This is an + incompatible change since distcp may not be able to copy files + from cluster A (compiled with this patch) to cluster B (compiled with previous versions). (Tsz Wo (Nicholas), SZE via dhruba) NEW FEATURES @@ -11809,7 +11806,7 @@ Release 0.16.0 - 2008-02-07 HADOOP-1652. A utility to balance data among datanodes in a HDFS cluster. (Hairong Kuang via dhruba) - HADOOP-2085. A library to support map-side joins of consistently + HADOOP-2085. A library to support map-side joins of consistently partitioned and sorted data sets. (Chris Douglas via omalley) HADOOP-2336. Shell commands to modify file permissions. (rangadi) @@ -11817,7 +11814,7 @@ Release 0.16.0 - 2008-02-07 HADOOP-1298. Implement file permissions for HDFS. (Tsz Wo (Nicholas) & taton via cutting) - HADOOP-2447. 
HDFS can be configured to limit the total number of + HADOOP-2447. HDFS can be configured to limit the total number of objects (inodes and blocks) in the file system. (dhruba) HADOOP-2487. Added an option to get statuses for all submitted/run jobs. @@ -11829,7 +11826,7 @@ Release 0.16.0 - 2008-02-07 HADOOP-2532. Add to MapFile a getClosest method that returns the key that comes just before if the key is not present. (stack via tomwhite) - + HADOOP-1883. Add versioning to Record I/O. (Vivek Ratan via ddas) HADOOP-2603. Add SeqeunceFileAsBinaryInputFormat, which reads @@ -11852,11 +11849,11 @@ Release 0.16.0 - 2008-02-07 HADOOP-1855. fsck verifies block placement policies and reports violations. (Konstantin Shvachko via dhruba) - HADOOP-1604. An system administrator can finalize namenode upgrades + HADOOP-1604. An system administrator can finalize namenode upgrades without running the cluster. (Konstantin Shvachko via dhruba) HADOOP-1839. Link-ify the Pending/Running/Complete/Killed grid in - jobdetails.jsp to help quickly narrow down and see categorized TIPs' + jobdetails.jsp to help quickly narrow down and see categorized TIPs' details via jobtasks.jsp. (Amar Kamat via acmurthy) HADOOP-1210. Log counters in job history. (Owen O'Malley via ddas) @@ -11867,7 +11864,7 @@ Release 0.16.0 - 2008-02-07 HADOOP-2086. This patch adds the ability to add dependencies to a job (run via JobControl) after construction. (Adrian Woodhead via ddas) - HADOOP-1185. Support changing the logging level of a server without + HADOOP-1185. Support changing the logging level of a server without restarting the server. (Tsz Wo (Nicholas), SZE via dhruba) HADOOP-2134. Remove developer-centric requirements from overview.html and @@ -11876,17 +11873,17 @@ Release 0.16.0 - 2008-02-07 HADOOP-1989. Support simulated DataNodes. This helps creating large virtual clusters for testing purposes. (Sanjay Radia via dhruba) - + HADOOP-1274. 
Support different number of mappers and reducers per TaskTracker to allow administrators to better configure and utilize - heterogenous clusters. + heterogenous clusters. Configuration changes to hadoop-default.xml: add mapred.tasktracker.map.tasks.maximum (default value of 2) add mapred.tasktracker.reduce.tasks.maximum (default value of 2) remove mapred.tasktracker.tasks.maximum (deprecated for 0.16.0) - (Amareshwari Sri Ramadasu via acmurthy) + (Amareshwari Sri Ramadasu via acmurthy) - HADOOP-2104. Adds a description to the ant targets. This makes the + HADOOP-2104. Adds a description to the ant targets. This makes the output of "ant -projecthelp" sensible. (Chris Douglas via ddas) HADOOP-2127. Added a pipes sort example to benchmark trivial pipes @@ -11899,8 +11896,8 @@ Release 0.16.0 - 2008-02-07 permits each to determine what files are copied into release builds. (stack via cutting) - HADOOP-1984. Makes the backoff for failed fetches exponential. - Earlier, it was a random backoff from an interval. + HADOOP-1984. Makes the backoff for failed fetches exponential. + Earlier, it was a random backoff from an interval. (Amar Kamat via ddas) HADOOP-1327. Include website documentation for streaming. (Rob Weltman @@ -11916,19 +11913,19 @@ Release 0.16.0 - 2008-02-07 HADOOP-2326. The initial block report at Datanode startup time has a random backoff period. (Sanjay Radia via dhruba) - HADOOP-2432. HDFS includes the name of the file while throwing + HADOOP-2432. HDFS includes the name of the file while throwing "File does not exist" exception. (Jim Kellerman via dhruba) HADOOP-2457. Added a 'forrest.home' property to the 'docs' target in - build.xml. (acmurthy) + build.xml. (acmurthy) - HADOOP-2149. A new benchmark for three name-node operation: file create, - open, and block report, to evaluate the name-node performance + HADOOP-2149. 
A new benchmark for three name-node operation: file create, + open, and block report, to evaluate the name-node performance for optimizations or new features. (Konstantin Shvachko via shv) HADOOP-2466. Change FileInputFormat.computeSplitSize to a protected non-static method to allow sub-classes to provide alternate - implementations. (Alejandro Abdelnur via acmurthy) + implementations. (Alejandro Abdelnur via acmurthy) HADOOP-2425. Change TextOutputFormat to handle Text specifically for better performance. Make NullWritable implement Comparable. Make TextOutputFormat @@ -11936,14 +11933,14 @@ Release 0.16.0 - 2008-02-07 HADOOP-1719. Improves the utilization of shuffle copier threads. (Amar Kamat via ddas) - + HADOOP-2390. Added documentation for user-controls for intermediate - map-outputs & final job-outputs and native-hadoop libraries. (acmurthy) - + map-outputs & final job-outputs and native-hadoop libraries. (acmurthy) + HADOOP-1660. Add the cwd of the map/reduce task to the java.library.path of the child-jvm to support loading of native libraries distributed via the DistributedCache. (acmurthy) - + HADOOP-2285. Speeds up TextInputFormat. Also includes updates to the Text API. (Owen O'Malley via cdouglas) @@ -11952,7 +11949,7 @@ Release 0.16.0 - 2008-02-07 HADOOP-2369. Adds a set of scripts for simulating a mix of user map/reduce workloads. (Runping Qi via cdouglas) - HADOOP-2547. Removes use of a 'magic number' in build.xml. + HADOOP-2547. Removes use of a 'magic number' in build.xml. (Hrishikesh via nigel) HADOOP-2268. Fix org.apache.hadoop.mapred.jobcontrol classes to use the @@ -11968,13 +11965,13 @@ Release 0.16.0 - 2008-02-07 deprecated mapred.speculative.execution add mapred.map.tasks.speculative.execution add mapred.reduce.tasks.speculative.execution - (Amareshwari Sri Ramadasu via acmurthy) - + (Amareshwari Sri Ramadasu via acmurthy) + HADOOP-1965. Interleave sort/spill in teh map-task along with calls to the Mapper.map method. 
This is done by splitting the 'io.sort.mb' buffer into two and using one half for collecting map-outputs and the other half for sort/spill. (Amar Kamat via acmurthy) - + HADOOP-2464. Unit tests for chmod, chown, and chgrp using DFS. (Raghu Angadi) @@ -11986,10 +11983,10 @@ Release 0.16.0 - 2008-02-07 add mapred.job.tracker.persist.jobstatus.hours (default value of 0) add mapred.job.tracker.persist.jobstatus.dir (default value of /jobtracker/jobsInfo) - (Alejandro Abdelnur via acmurthy) + (Alejandro Abdelnur via acmurthy) HADOOP-2077. Added version and build information to STARTUP_MSG for all - hadoop daemons to aid error-reporting, debugging etc. (acmurthy) + hadoop daemons to aid error-reporting, debugging etc. (acmurthy) HADOOP-2398. Additional instrumentation for NameNode and RPC server. Add support for accessing instrumentation statistics via JMX. @@ -12018,14 +12015,14 @@ Release 0.16.0 - 2008-02-07 HADOOP-2596. Added a SequenceFile.createWriter api which allows the user to specify the blocksize, replication factor and the buffersize to be - used for the underlying HDFS file. (Alejandro Abdelnur via acmurthy) + used for the underlying HDFS file. (Alejandro Abdelnur via acmurthy) HADOOP-2431. Test HDFS File Permissions. (Hairong Kuang via shv) HADOOP-2232. Add an option to disable Nagle's algorithm in the IPC stack. (Clint Morgan via cdouglas) - HADOOP-2342. Created a micro-benchmark for measuring + HADOOP-2342. Created a micro-benchmark for measuring local-file versus hdfs reads. (Owen O'Malley via nigel) HADOOP-2529. First version of HDFS User Guide. (Raghu Angadi) @@ -12038,13 +12035,13 @@ Release 0.16.0 - 2008-02-07 HADOOP-1898. Release the lock protecting the last time of the last stack dump while the dump is happening. (Amareshwari Sri Ramadasu via omalley) - HADOOP-1900. Makes the heartbeat and task event queries interval + HADOOP-1900. Makes the heartbeat and task event queries interval dependent on the cluster size. 
(Amareshwari Sri Ramadasu via ddas) - HADOOP-2208. Counter update frequency (from TaskTracker to JobTracker) is + HADOOP-2208. Counter update frequency (from TaskTracker to JobTracker) is capped at 1 minute. (Amareshwari Sri Ramadasu via ddas) - HADOOP-2284. Reduce the number of progress updates during the sorting in + HADOOP-2284. Reduce the number of progress updates during the sorting in the map task. (Amar Kamat via ddas) BUG FIXES @@ -12056,14 +12053,14 @@ Release 0.16.0 - 2008-02-07 'mkdir -p' check & create it. (Michael Bieniosek via acmurthy) HADOOP-1642. Ensure jobids generated by LocalJobRunner are unique to - avoid collissions and hence job-failures. (Doug Cutting via acmurthy) + avoid collisions and hence job-failures. (Doug Cutting via acmurthy) HADOOP-2096. Close open file-descriptors held by streams while localizing - job.xml in the JobTracker and while displaying it on the webui in + job.xml in the JobTracker and while displaying it on the webui in jobconf.jsp. (Amar Kamat via acmurthy) HADOOP-2098. Log start & completion of empty jobs to JobHistory, which - also ensures that we close the file-descriptor of the job's history log + also ensures that we close the file-descriptor of the job's history log opened during job-submission. (Amar Kamat via acmurthy) HADOOP-2112. Adding back changes to build.xml lost while reverting @@ -12077,7 +12074,7 @@ Release 0.16.0 - 2008-02-07 wrapped over the DFSInputStream since mark/reset aren't supported by DFSInputStream anymore. (Lohit Vijayarenu via acmurthy) - HADOOP-1348. Allow XML comments inside configuration files. + HADOOP-1348. Allow XML comments inside configuration files. (Rajagopal Natarajan and Enis Soztutar via enis) HADOOP-1952. Improve handling of invalid, user-specified classes while @@ -12101,34 +12098,34 @@ Release 0.16.0 - 2008-02-07 HADOOP-2078. An zero size file may have no blocks associated with it. (Konstantin Shvachko via dhruba) - HADOOP-2212.
ChecksumFileSystem.getSumBufferSize might throw + HADOOP-2212. ChecksumFileSystem.getSumBufferSize might throw java.lang.ArithmeticException. The fix is to initialize bytesPerChecksum to 0. (Michael Bieniosek via ddas) HADOOP-2216. Fix jobtasks.jsp to ensure that it first collects the taskids which satisfy the filtering criteria and then use that list to print out only the required task-reports, previously it was oblivious to - the filtering and hence used the wrong index into the array of task-reports. + the filtering and hence used the wrong index into the array of task-reports. (Amar Kamat via acmurthy) HADOOP-2272. Fix findbugs target to reflect changes made to the location of the streaming jar file by HADOOP-2207. (Adrian Woodhead via nigel) - HADOOP-2244. Fixes the MapWritable.readFields to clear the instance + HADOOP-2244. Fixes the MapWritable.readFields to clear the instance field variable every time readFields is called. (Michael Stack via ddas). - HADOOP-2245. Fixes LocalJobRunner to include a jobId in the mapId. Also, + HADOOP-2245. Fixes LocalJobRunner to include a jobId in the mapId. Also, adds a testcase for JobControl. (Adrian Woodhead via ddas). - HADOOP-2275. Fix erroneous detection of corrupted file when namenode + HADOOP-2275. Fix erroneous detection of corrupted file when namenode fails to allocate any datanodes for newly allocated block. (Dhruba Borthakur via dhruba) HADOOP-2256. Fix a buf in the namenode that could cause it to encounter - an infinite loop while deleting excess replicas that were created by + an infinite loop while deleting excess replicas that were created by block rebalancing. (Hairong Kuang via dhruba) - HADOOP-2209. SecondaryNamenode process exits if it encounters exceptions + HADOOP-2209. SecondaryNamenode process exits if it encounters exceptions that it cannot handle. (Dhruba Borthakur via dhruba) HADOOP-2314. 
Prevent TestBlockReplacement from occasionally getting @@ -12156,16 +12153,16 @@ Release 0.16.0 - 2008-02-07 HADOOP-2359. Remove warning for interruptted exception when closing down minidfs. (dhruba via omalley) - HADOOP-1841. Prevent slow clients from consuming threads in the NameNode. + HADOOP-1841. Prevent slow clients from consuming threads in the NameNode. (dhruba) - + HADOOP-2323. JobTracker.close() should not print stack traces for normal exit. (jimk via cutting) HADOOP-2376. Prevents sort example from overriding the number of maps. (Owen O'Malley via ddas) - HADOOP-2434. FSDatasetInterface read interface causes HDFS reads to occur + HADOOP-2434. FSDatasetInterface read interface causes HDFS reads to occur in 1 byte chunks, causing performance degradation. (Raghu Angadi via dhruba) @@ -12174,16 +12171,16 @@ Release 0.16.0 - 2008-02-07 HADOOP-2215. Fix documentation in cluster_setup.html & mapred_tutorial.html reflect that mapred.tasktracker.tasks.maximum has - been superceeded by mapred.tasktracker.{map|reduce}.tasks.maximum. + been superseded by mapred.tasktracker.{map|reduce}.tasks.maximum. (Amareshwari Sri Ramadasu via acmurthy) HADOOP-2459. Fix package target so that src/docs/build files are not included in the release. (nigel) HADOOP-2352. Remove AC_CHECK_LIB for libz and liblzo to ensure that - libhadoop.so doesn't have a dependency on them. (acmurthy) + libhadoop.so doesn't have a dependency on them. (acmurthy) - HADOOP-2453. Fix the configuration for wordcount-simple example in Hadoop + HADOOP-2453. Fix the configuration for wordcount-simple example in Hadoop Pipes which currently produces an XML parsing error. (Amareshwari Sri Ramadasu via acmurthy) @@ -12197,24 +12194,24 @@ Release 0.16.0 - 2008-02-07 reducer and the number of fetch-failures vis-a-vis total number of fetch-attempts are taken into account before teh reducer kills itself. (Amar Kamat via acmurthy) - + HADOOP-2452.
Fix eclipse plug-in build.xml to refers to the right location where hadoop-*-core.jar is generated. (taton) - HADOOP-2492. Additional debugging in the rpc server to better + HADOOP-2492. Additional debugging in the rpc server to better diagnose ConcurrentModificationException. (dhruba) HADOOP-2344. Enhance the utility for executing shell commands to read the stdout/stderr streams while waiting for the command to finish (to free up the buffers). Also, this patch throws away stderr of the DF utility. - @deprecated + @deprecated org.apache.hadoop.fs.ShellCommand for org.apache.hadoop.util.Shell - org.apache.hadoop.util.ShellUtil for + org.apache.hadoop.util.ShellUtil for org.apache.hadoop.util.Shell.ShellCommandExecutor (Amar Kamat via acmurthy) HADOOP-2511. Fix a javadoc warning in org.apache.hadoop.util.Shell - introduced by HADOOP-2344. (acmurthy) + introduced by HADOOP-2344. (acmurthy) HADOOP-2442. Fix TestLocalFileSystemPermission.testLocalFSsetOwner to work on more platforms. (Raghu Angadi via nigel) @@ -12255,7 +12252,7 @@ Release 0.16.0 - 2008-02-07 HADOOP-2605. Remove bogus leading slash in task-tracker report bindAddress. (Konstantin Shvachko) - + HADOOP-2620. Trivial. 'bin/hadoop fs -help' did not list chmod, chown, and chgrp. (Raghu Angadi) @@ -12269,8 +12266,8 @@ Release 0.16.0 - 2008-02-07 HADOOP-290. A DataNode log message now prints the target of a replication request correctly. (dhruba) - HADOOP-2538. Redirect to a warning, if plaintext parameter is true but - the filter parameter is not given in TaskLogServlet. + HADOOP-2538. Redirect to a warning, if plaintext parameter is true but + the filter parameter is not given in TaskLogServlet. (Michael Bieniosek via enis) HADOOP-2582. Prevent 'bin/hadoop fs -copyToLocal' from creating @@ -12283,10 +12280,10 @@ Release 0.16.0 - 2008-02-07 the datanodes. The periodicity of this computation is now configurable. (dhruba) - HADOOP-2549. Correct disk size computation so that data-nodes could switch + HADOOP-2549. 
Correct disk size computation so that data-nodes could switch to other local drives if current is full. (Hairong Kuang via shv) - HADOOP-2633. Fsck should call name-node methods directly rather than + HADOOP-2633. Fsck should call name-node methods directly rather than through rpc. (Tsz Wo (Nicholas), SZE via shv) HADOOP-2687. Modify a few log message generated by dfs client to be @@ -12294,7 +12291,7 @@ Release 0.16.0 - 2008-02-07 HADOOP-2402. Fix BlockCompressorStream to ensure it buffers data before sending it down to the compressor so that each write call doesn't - compress. (Chris Douglas via acmurthy) + compress. (Chris Douglas via acmurthy) HADOOP-2645. The Metrics initialization code does not throw exceptions when servers are restarted by MiniDFSCluster. @@ -12313,12 +12310,12 @@ Release 0.16.0 - 2008-02-07 HADOOP-2626. Fix paths with special characters to work correctly with the local filesystem. (Thomas Friol via cutting) - HADOOP-2646. Fix SortValidator to work with fully-qualified + HADOOP-2646. Fix SortValidator to work with fully-qualified working directories. (Arun C Murthy via nigel) HADOOP-2092. Added a ping mechanism to the pipes' task to periodically check if the parent Java task is running, and exit if the parent isn't - alive and responding. (Amareshwari Sri Ramadasu via acmurthy) + alive and responding. (Amareshwari Sri Ramadasu via acmurthy) HADOOP-2714. TestDecommission failed on windows because the replication request was timing out. (dhruba) @@ -12329,8 +12326,8 @@ Release 0.16.0 - 2008-02-07 HADOOP-2713. TestDatanodeDeath failed on windows because the replication request was timing out. (dhruba) - HADOOP-2639. Fixes a problem to do with incorrect maintenance of values - for runningMapTasks/runningReduceTasks. (Amar Kamat and Arun Murthy + HADOOP-2639. Fixes a problem to do with incorrect maintenance of values + for runningMapTasks/runningReduceTasks. (Amar Kamat and Arun Murthy via ddas) HADOOP-2723. 
Fixed the check for checking whether to do user task @@ -12346,7 +12343,7 @@ Release 0.16.0 - 2008-02-07 HADOOP-2404. Fix backwards compatability with hadoop-0.15 configuration files that was broken by HADOOP-2185. (omalley) - HADOOP-2755. Fix fsck performance degradation because of permissions + HADOOP-2755. Fix fsck performance degradation because of permissions issue. (Tsz Wo (Nicholas), SZE via dhruba) HADOOP-2768. Fix performance regression caused by HADOOP-1707. @@ -12366,16 +12363,16 @@ Release 0.15.3 - 2008-01-18 created from the task cwds. HADOOP-2574. Fixed mapred_tutorial.xml to correct minor errors with the - WordCount examples. (acmurthy) + WordCount examples. (acmurthy) Release 0.15.2 - 2008-01-02 BUG FIXES - HADOOP-2246. Moved the changelog for HADOOP-1851 from the NEW FEATURES + HADOOP-2246. Moved the changelog for HADOOP-1851 from the NEW FEATURES section to the INCOMPATIBLE CHANGES section. (acmurthy) - HADOOP-2238. Fix TaskGraphServlet so that it sets the content type of + HADOOP-2238. Fix TaskGraphServlet so that it sets the content type of the response appropriately. (Paul Saab via enis) HADOOP-2129. Fix so that distcp works correctly when source is @@ -12386,10 +12383,10 @@ Release 0.15.2 - 2008-01-02 get created after the job completes. (Alejandro Abdelnur via ddas) HADOOP-2228. Checks whether a job with a certain jobId is already running - and then tries to create the JobInProgress object. + and then tries to create the JobInProgress object. (Johan Oskarsson via ddas) - HADOOP-2422. dfs -cat multiple files fail with 'Unable to write to + HADOOP-2422. dfs -cat multiple files fail with 'Unable to write to output stream'. (Raghu Angadi via dhruba) HADOOP-2460. When the namenode encounters ioerrors on writing a @@ -12439,26 +12436,26 @@ Release 0.15.1 - 2007-11-27 IMPROVEMENTS HADOOP-1917. Addition of guides/tutorial for better overall - documentation for Hadoop. 
Specifically: - * quickstart.html is targetted towards first-time users and helps them - setup a single-node cluster and play with Hadoop. + documentation for Hadoop. Specifically: + * quickstart.html is targeted towards first-time users and helps them + setup a single-node cluster and play with Hadoop. * cluster_setup.html helps admins to configure and setup non-trivial hadoop clusters. - * mapred_tutorial.html is a comprehensive Map-Reduce tutorial. - (acmurthy) + * mapred_tutorial.html is a comprehensive Map-Reduce tutorial. + (acmurthy) BUG FIXES HADOOP-2174. Removed the unnecessary Reporter.setStatus call from FSCopyFilesMapper.close which led to a NPE since the reporter isn't valid - in the close method. (Chris Douglas via acmurthy) + in the close method. (Chris Douglas via acmurthy) HADOOP-2172. Restore performance of random access to local files by caching positions of local input streams, avoiding a system call. (cutting) HADOOP-2205. Regenerate the Hadoop website since some of the changes made - by HADOOP-1917 weren't correctly copied over to the trunk/docs directory. + by HADOOP-1917 weren't correctly copied over to the trunk/docs directory. Also fixed a couple of minor typos and broken links. (acmurthy) Release 0.15.0 - 2007-11-2 @@ -12473,7 +12470,7 @@ Release 0.15.0 - 2007-11-2 (Tsz Wo (Nicholas), SZE via dhruba) HADOOP-932. File locking interfaces and implementations (that were - earlier deprecated) are removed. Client Protocol version changed + earlier deprecated) are removed. Client Protocol version changed from 15 to 16. (Raghu Angadi via dhruba) HADOOP-1621. FileStatus is now a concrete class and FileSystem.listPaths @@ -12492,7 +12489,7 @@ Release 0.15.0 - 2007-11-2 with a 'final' tag may not be overridden by subsequently loaded configuration files, e.g., by jobs. (Arun C. Murthy via cutting) - HADOOP-1846.
DatanodeReport in ClientProtocol can report live datanodes, dead datanodes or all datanodes. Client Protocol version changed from 17 to 18. (Hairong Kuang via dhruba) @@ -12528,17 +12525,17 @@ Release 0.15.0 - 2007-11-2 HADOOP-1351. Add "bin/hadoop job [-fail-task|-kill-task]" sub-commands to terminate a particular task-attempt. (Enis Soztutar via acmurthy) - HADOOP-1880. SleepJob : An example job that sleeps at each map and + HADOOP-1880. SleepJob : An example job that sleeps at each map and reduce task. (enis) HADOOP-1809. Add a link in web site to #hadoop IRC channel. (enis) - HADOOP-1894. Add percentage graphs and mapred task completion graphs - to Web User Interface. Users not using Firefox may install a plugin to + HADOOP-1894. Add percentage graphs and mapred task completion graphs + to Web User Interface. Users not using Firefox may install a plugin to their browsers to see svg graphics. (enis) - HADOOP-1914. Introduce a new NamenodeProtocol to allow secondary - namenodes and rebalancing processes to communicate with a primary + HADOOP-1914. Introduce a new NamenodeProtocol to allow secondary + namenodes and rebalancing processes to communicate with a primary namenode. (Hairong Kuang via dhruba) HADOOP-1963. Add a FileSystem implementation for the Kosmos @@ -12559,8 +12556,8 @@ Release 0.15.0 - 2007-11-2 HADOOP-1910. Reduce the number of RPCs that DistributedFileSystem.create() makes to the namenode. (Raghu Angadi via dhruba) - HADOOP-1565. Reduce memory usage of NameNode by replacing - TreeMap in HDFS Namespace with ArrayList. + HADOOP-1565. Reduce memory usage of NameNode by replacing + TreeMap in HDFS Namespace with ArrayList. (Dhruba Borthakur via dhruba) HADOOP-1743. Change DFS INode from a nested class to standalone @@ -12591,17 +12588,17 @@ Release 0.15.0 - 2007-11-2 HADOOP-1935. Fix a NullPointerException in internalReleaseCreate. (Dhruba Borthakur) - HADOOP-1933. The nodes listed in include and exclude files + HADOOP-1933. 
The nodes listed in include and exclude files are always listed in the datanode report. (Raghu Angadi via dhruba) - HADOOP-1953. The job tracker should wait beteween calls to try and delete + HADOOP-1953. The job tracker should wait between calls to try and delete the system directory (Owen O'Malley via devaraj) HADOOP-1932. TestFileCreation fails with message saying filestatus.dat is of incorrect size. (Dhruba Borthakur via dhruba) - HADOOP-1573. Support for 0 reducers in PIPES. + HADOOP-1573. Support for 0 reducers in PIPES. (Owen O'Malley via devaraj) HADOOP-1500. Fix typographical errors in the DFS WebUI. @@ -12668,11 +12665,11 @@ Release 0.15.0 - 2007-11-2 HADOOP-1853. Fix contrib/streaming to accept multiple -cacheFile options. (Prachi Gupta via cutting) - HADOOP-1818. Fix MultiFileInputFormat so that it does not return + HADOOP-1818. Fix MultiFileInputFormat so that it does not return empty splits when numPaths < numSplits. (Thomas Friol via enis) HADOOP-1840. Fix race condition which leads to task's diagnostic - messages getting lost. (acmurthy) + messages getting lost. (acmurthy) HADOOP-1885. Fix race condition in MiniDFSCluster shutdown. (Chris Douglas via nigel) @@ -12723,11 +12720,11 @@ Release 0.15.0 - 2007-11-2 HADOOP-1875. Non-existant directories or read-only directories are filtered from dfs.client.buffer.dir. (Hairong Kuang via dhruba) - HADOOP-1992. Fix the performance degradation in the sort validator. + HADOOP-1992. Fix the performance degradation in the sort validator. (acmurthy via omalley) HADOOP-1874. Move task-outputs' promotion/discard to a separate thread - distinct from the main heartbeat-processing thread. The main upside being + distinct from the main heartbeat-processing thread. The main upside being that we do not lock-up the JobTracker during HDFS operations, which otherwise may lead to lost tasktrackers if the NameNode is unresponsive.
(Devaraj Das via acmurthy) @@ -12739,8 +12736,8 @@ Release 0.15.0 - 2007-11-2 recorded at the JobTracker, so that, for example, one may view correct information via taskdetails.jsp. This bug was introduced by HADOOP-1874. (Amar Kamat via acmurthy) - - HADOOP-2031. Correctly maintain the taskid which takes the TIP to + + HADOOP-2031. Correctly maintain the taskid which takes the TIP to completion, failing which the case of lost tasktrackers isn't handled properly i.e. the map TIP is incorrectly left marked as 'complete' and it is never rescheduled elsewhere, leading to hung reduces. @@ -12749,23 +12746,23 @@ Release 0.15.0 - 2007-11-2 HADOOP-2018. The source datanode of a data transfer waits for a response from the target datanode before closing the data stream. (Hairong Kuang via dhruba) - + HADOOP-2023. Disable TestLocalDirAllocator on Windows. (Hairong Kuang via nigel) - HADOOP-2016. Ignore status-updates from FAILED/KILLED tasks at the - TaskTracker. This fixes a race-condition which caused the tasks to wrongly + HADOOP-2016. Ignore status-updates from FAILED/KILLED tasks at the + TaskTracker. This fixes a race-condition which caused the tasks to wrongly remain in the RUNNING state even after being killed by the JobTracker and thus handicap the cleanup of the task's output sub-directory. (acmurthy) - HADOOP-1771. Fix a NullPointerException in streaming caused by an + HADOOP-1771. Fix a NullPointerException in streaming caused by an IOException in MROutputThread. (lohit vijayarenu via nigel) - HADOOP-2028. Fix distcp so that the log dir does not need to be + HADOOP-2028. Fix distcp so that the log dir does not need to be specified and the destination does not need to exist. (Chris Douglas via nigel) - HADOOP-2044. The namenode protects all lease manipulations using a + HADOOP-2044. The namenode protects all lease manipulations using a sortedLease lock. (Dhruba Borthakur) HADOOP-2051. 
The TaskCommit thread should not die for exceptions other @@ -12775,7 +12772,7 @@ Release 0.15.0 - 2007-11-2 HADOOP-1973. The FileSystem object would be accessed on the JobTracker through a RPC in the InterTrackerProtocol. The check for the object being null was missing and hence NPE would be thrown sometimes. This issue fixes - that problem. (Amareshwari Sri Ramadasu via ddas) + that problem. (Amareshwari Sri Ramadasu via ddas) HADOOP-2033. The SequenceFile.Writer.sync method was a no-op, which caused very uneven splits for applications like distcp that count on them. @@ -12794,24 +12791,24 @@ Release 0.15.0 - 2007-11-2 HADOOP-2073. Change size of VERSION file after writing contents to it. (Konstantin Shvachko via dhruba) - + HADOOP-2102. Fix the deprecated ToolBase to pass its Configuration object to the superceding ToolRunner to ensure it picks up the appropriate - configuration resources. (Dennis Kubes and Enis Soztutar via acmurthy) - + configuration resources. (Dennis Kubes and Enis Soztutar via acmurthy) + HADOOP-2103. Fix minor javadoc bugs introduce by HADOOP-2046. (Nigel - Daley via acmurthy) + Daley via acmurthy) IMPROVEMENTS - HADOOP-1908. Restructure data node code so that block sending and + HADOOP-1908. Restructure data node code so that block sending and receiving are seperated from data transfer header handling. (Hairong Kuang via dhruba) HADOOP-1921. Save the configuration of completed/failed jobs and make them available via the web-ui. (Amar Kamat via devaraj) - HADOOP-1266. Remove dependency of package org.apache.hadoop.net on + HADOOP-1266. Remove dependency of package org.apache.hadoop.net on org.apache.hadoop.dfs. (Hairong Kuang via dhruba) HADOOP-1779. Replace INodeDirectory.getINode() by a getExistingPathINodes() @@ -12884,10 +12881,10 @@ Release 0.15.0 - 2007-11-2 (Enis Soztutar via cutting) HADOOP-1569. 
Reimplement DistCP to use the standard FileSystem/URI - code in Hadoop so that you can copy from and to all of the supported file + code in Hadoop so that you can copy from and to all of the supported file systems.(Chris Douglas via omalley) - HADOOP-1018. Improve documentation w.r.t handling of lost hearbeats between + HADOOP-1018. Improve documentation w.r.t handling of lost heartbeats between TaskTrackers and JobTracker. (acmurthy) HADOOP-1718. Add ant targets for measuring code coverage with clover. @@ -12912,16 +12909,16 @@ Release 0.15.0 - 2007-11-2 HADOOP-1971. Warn when job does not specify a jar. (enis via cutting) - HADOOP-1942. Increase the concurrency of transaction logging to + HADOOP-1942. Increase the concurrency of transaction logging to edits log. Reduce the number of syncs by double-buffering the changes to the transaction log. (Dhruba Borthakur) HADOOP-2046. Improve mapred javadoc. (Arun C. Murthy via cutting) - HADOOP-2105. Improve overview.html to clarify supported platforms, - software pre-requisites for hadoop, how to install them on various - platforms and a better general description of hadoop and it's utility. - (Jim Kellerman via acmurthy) + HADOOP-2105. Improve overview.html to clarify supported platforms, + software pre-requisites for hadoop, how to install them on various + platforms and a better general description of hadoop and its utility. + (Jim Kellerman via acmurthy) Release 0.14.4 - 2007-11-26 @@ -12933,7 +12930,7 @@ Release 0.14.4 - 2007-11-26 HADOOP-2169. Fix the DT_SONAME field of libhdfs.so to set it to the correct value of 'libhdfs.so', currently it is set to the absolute path of - libhdfs.so. (acmurthy) + libhdfs.so. (acmurthy) HADOOP-2001. Make the job priority updates and job kills synchronized on the JobTracker. Deadlock was seen in the JobTracker because of the lack of @@ -12944,7 +12941,7 @@ Release 0.14.3 - 2007-10-19 BUG FIXES - HADOOP-2053.
Fixed a dangling reference to a memory buffer in the map output sorter. (acmurthy via omalley) HADOOP-2036. Fix a NullPointerException in JvmMetrics class. (nigel) @@ -12960,9 +12957,9 @@ Release 0.14.2 - 2007-10-09 HADOOP-1948. Removed spurious error message during block crc upgrade. (Raghu Angadi via dhruba) - HADOOP-1862. reduces are getting stuck trying to find map outputs. + HADOOP-1862. reduces are getting stuck trying to find map outputs. (Arun C. Murthy via ddas) - + HADOOP-1977. Fixed handling of ToolBase cli options in JobClient. (enis via omalley) @@ -13058,7 +13055,7 @@ Release 0.14.0 - 2007-08-17 to be the same as the replication factor of the original file. (Dhruba Borthakur via tomwhite.) - 6. HADOOP-1355. Fix null pointer dereference in + 6. HADOOP-1355. Fix null pointer dereference in TaskLogAppender.append(LoggingEvent). (Arun C Murthy via tomwhite.) 7. HADOOP-1357. Fix CopyFiles to correctly avoid removing "/". @@ -13311,7 +13308,7 @@ Release 0.14.0 - 2007-08-17 83. HADOOP-1520. Add appropriate synchronization to FSEditsLog. (Dhruba Borthakur via nigel) - 84. HADOOP-1513. Fix a race condition in directory creation. + 84. HADOOP-1513. Fix a race condition in directory creation. (Devaraj via omalley) 85. HADOOP-1546. Remove spurious column from HDFS web UI. @@ -13436,7 +13433,7 @@ Release 0.14.0 - 2007-08-17 to support later versions of ec2-api-tools. (Stu Hood via tomwhite) 133. HADOOP-1638. Fix contrib EC2 scripts to support NAT addressing. - (Stu Hood via tomwhite) + (Stu Hood via tomwhite) 134. HADOOP-1632. Fix an IllegalArgumentException in fsck. (Hairong Kuang via cutting) @@ -13469,7 +13466,7 @@ Release 0.14.0 - 2007-08-17 143. HADOOP-1553. Replace user task output and log capture code to use shell redirection instead of copier threads in the TaskTracker. Capping the - size of the output is now done via tail in memory and thus should not be + size of the output is now done via tail in memory and thus should not be large. 
The output of the tasklog servlet is not forced into UTF8 and is not buffered entirely in memory. (omalley) Configuration changes to hadoop-default.xml: @@ -13503,7 +13500,7 @@ Release 0.14.0 - 2007-08-17 148. HADOOP-1680. Improvements to Block CRC upgrade messages. (Raghu Angadi via dhruba) -149. HADOOP-71. Allow Text and SequenceFile Map/Reduce inputs from non-default +149. HADOOP-71. Allow Text and SequenceFile Map/Reduce inputs from non-default filesystems. (omalley) 150. HADOOP-1568. Expose HDFS as xml/http filesystem to provide cross-version @@ -13617,7 +13614,7 @@ Release 0.13.0 - 2007-06-08 25. HADOOP-1170. Improve datanode performance by removing device checks from common operations. (Igor Bolotin via cutting) -26. HADOOP-1090. Fix SortValidator's detection of whether the input +26. HADOOP-1090. Fix SortValidator's detection of whether the input file belongs to the sort-input or sort-output directory. (Arun C Murthy via tomwhite) @@ -13644,7 +13641,7 @@ Release 0.13.0 - 2007-06-08 34. HADOOP-1133. Add tool to analyze and debug namenode on a production cluster. (Dhruba Borthakur via tomwhite) -35. HADOOP-1151. Remove spurious printing to stderr in streaming +35. HADOOP-1151. Remove spurious printing to stderr in streaming PipeMapRed. (Koji Noguchi via tomwhite) 36. HADOOP-988. Change namenode to use a single map of blocks to metadata. @@ -13658,40 +13655,40 @@ Release 0.13.0 - 2007-06-08 long-running unit tests may be automatically terminated. (Nigel Daley via cutting) -39. HADOOP-1149. Improve DFS Scalability: make - processOverReplicatedBlock() a no-op if blocks are not +39. HADOOP-1149. Improve DFS Scalability: make + processOverReplicatedBlock() a no-op if blocks are not over-replicated. (Raghu Angadi via tomwhite) -40. HADOOP-1149. Improve DFS Scalability: optimize getDistance(), - contains(), and isOnSameRack() in NetworkTopology. +40. HADOOP-1149. Improve DFS Scalability: optimize getDistance(), + contains(), and isOnSameRack() in NetworkTopology. 
(Hairong Kuang via tomwhite) -41. HADOOP-1218. Make synchronization on TaskTracker's RunningJob +41. HADOOP-1218. Make synchronization on TaskTracker's RunningJob object consistent. (Devaraj Das via tomwhite) -42. HADOOP-1219. Ignore progress report once a task has reported as +42. HADOOP-1219. Ignore progress report once a task has reported as 'done'. (Devaraj Das via tomwhite) 43. HADOOP-1114. Permit user to specify additional CLASSPATH elements with a HADOOP_CLASSPATH environment variable. (cutting) -44. HADOOP-1198. Remove ipc.client.timeout parameter override from +44. HADOOP-1198. Remove ipc.client.timeout parameter override from unit test configuration. Using the default is more robust and has almost the same run time. (Arun C Murthy via tomwhite) -45. HADOOP-1211. Remove deprecated constructor and unused static +45. HADOOP-1211. Remove deprecated constructor and unused static members in DataNode class. (Konstantin Shvachko via tomwhite) -46. HADOOP-1136. Fix ArrayIndexOutOfBoundsException in - FSNamesystem$UnderReplicatedBlocks add() method. +46. HADOOP-1136. Fix ArrayIndexOutOfBoundsException in + FSNamesystem$UnderReplicatedBlocks add() method. (Hairong Kuang via tomwhite) 47. HADOOP-978. Add the client name and the address of the node that - previously started to create the file to the description of + previously started to create the file to the description of AlreadyBeingCreatedException. (Konstantin Shvachko via tomwhite) -48. HADOOP-1001. Check the type of keys and values generated by the - mapper against the types specified in JobConf. +48. HADOOP-1001. Check the type of keys and values generated by the + mapper against the types specified in JobConf. (Tahir Hashmi via tomwhite) 49. HADOOP-971. Improve DFS Scalability: Improve name node performance @@ -13722,27 +13719,27 @@ Release 0.13.0 - 2007-06-08 56. HADOOP-1239. Add a package name to some testjar test classes. (Jim Kellerman via cutting) -57. HADOOP-1241. 
Fix NullPointerException in processReport when +57. HADOOP-1241. Fix NullPointerException in processReport when namenode is restarted. (Dhruba Borthakur via tomwhite) -58. HADOOP-1244. Fix stop-dfs.sh to no longer incorrectly specify - slaves file for stopping datanode. +58. HADOOP-1244. Fix stop-dfs.sh to no longer incorrectly specify + slaves file for stopping datanode. (Michael Bieniosek via tomwhite) -59. HADOOP-1253. Fix ConcurrentModificationException and - NullPointerException in JobControl. +59. HADOOP-1253. Fix ConcurrentModificationException and + NullPointerException in JobControl. (Johan Oskarson via tomwhite) 60. HADOOP-1256. Fix NameNode so that multiple DataNodeDescriptors can no longer be created on startup. (Hairong Kuang via cutting) -61. HADOOP-1214. Replace streaming classes with new counterparts +61. HADOOP-1214. Replace streaming classes with new counterparts from Hadoop core. (Runping Qi via tomwhite) 62. HADOOP-1250. Move a chmod utility from streaming to FileUtil. (omalley via cutting) -63. HADOOP-1258. Fix TestCheckpoint test case to wait for +63. HADOOP-1258. Fix TestCheckpoint test case to wait for MiniDFSCluster to be active. (Nigel Daley via tomwhite) 64. HADOOP-1148. Re-indent all Java source code to consistently use @@ -13751,10 +13748,10 @@ Release 0.13.0 - 2007-06-08 65. HADOOP-1251. Add a method to Reporter to get the map InputSplit. (omalley via cutting) -66. HADOOP-1224. Fix "Browse the filesystem" link to no longer point +66. HADOOP-1224. Fix "Browse the filesystem" link to no longer point to dead datanodes. (Enis Soztutar via tomwhite) -67. HADOOP-1154. Fail a streaming task if the threads reading from or +67. HADOOP-1154. Fail a streaming task if the threads reading from or writing to the streaming process fail. (Koji Noguchi via tomwhite) 68. HADOOP-968. Move shuffle and sort to run in reduce's child JVM, @@ -13773,25 +13770,25 @@ Release 0.13.0 - 2007-06-08 rename causing possible reduce task hang. 
(Tahir Hashmi via tomwhite) -72. HADOOP-1050. Distinguish between failed and killed tasks so as to - not count a lost tasktracker against the job. +72. HADOOP-1050. Distinguish between failed and killed tasks so as to + not count a lost tasktracker against the job. (Arun C Murthy via tomwhite) -73. HADOOP-1271. Fix StreamBaseRecordReader to be able to log record +73. HADOOP-1271. Fix StreamBaseRecordReader to be able to log record data that's not UTF-8. (Arun C Murthy via tomwhite) -74. HADOOP-1190. Fix unchecked warnings in main Hadoop code. +74. HADOOP-1190. Fix unchecked warnings in main Hadoop code. (tomwhite) -75. HADOOP-1127. Fix AlreadyBeingCreatedException in namenode for +75. HADOOP-1127. Fix AlreadyBeingCreatedException in namenode for jobs run with speculative execution. (Arun C Murthy via tomwhite) 76. HADOOP-1282. Omnibus HBase patch. Improved tests & configuration. (Jim Kellerman via cutting) -77. HADOOP-1262. Make dfs client try to read from a different replica - of the checksum file when a checksum error is detected. +77. HADOOP-1262. Make dfs client try to read from a different replica + of the checksum file when a checksum error is detected. (Hairong Kuang via tomwhite) 78. HADOOP-1279. Fix JobTracker to maintain list of recently @@ -13817,7 +13814,7 @@ Release 0.13.0 - 2007-06-08 shuffle, sort and reduce. Use this to implement reduce=NONE option in contrib/streaming. (Runping Qi via cutting) -84. HADOOP-1294. Fix unchecked warnings in main Hadoop code under +84. HADOOP-1294. Fix unchecked warnings in main Hadoop code under Java 6. (tomwhite) 85. HADOOP-1299. Fix so that RPC will restart after RPC.stopClient() @@ -13829,16 +13826,16 @@ Release 0.13.0 - 2007-06-08 87. HADOOP-1290. Move contrib/abacus into mapred/lib/aggregate. (Runping Qi via cutting) -88. HADOOP-1272. Extract inner classes from FSNamesystem into separate +88. HADOOP-1272. Extract inner classes from FSNamesystem into separate classes. (Dhruba Borthakur via tomwhite) 89. 
HADOOP-1247. Add support to contrib/streaming for aggregate package, formerly called Abacus. (Runping Qi via cutting) 90. HADOOP-1061. Fix bug in listing files in the S3 filesystem. - NOTE: this change is not backwards compatible! You should use the - MigrationTool supplied to migrate existing S3 filesystem data to - the new format. Please backup your data first before upgrading + NOTE: this change is not backwards compatible! You should use the + MigrationTool supplied to migrate existing S3 filesystem data to + the new format. Please backup your data first before upgrading (using 'hadoop distcp' for example). (tomwhite) 91. HADOOP-1304. Make configurable the maximum number of task @@ -13961,7 +13958,7 @@ Release 0.13.0 - 2007-06-08 to indicate the default directory, per HADOOP-1386. (Hairong Kuang via cutting) -128. HADOOP-1411. Make task retry framework handle +128. HADOOP-1411. Make task retry framework handle AlreadyBeingCreatedException when wrapped as a RemoteException. (Hairong Kuang via tomwhite) @@ -14005,11 +14002,11 @@ Release 0.12.3 - 2007-04-06 command and a performance problem in HDFS's implementation of it. (Hairong Kuang via cutting) - 7. HADOOP-1105. Fix reducers to make "progress" while iterating + 7. HADOOP-1105. Fix reducers to make "progress" while iterating through values. (Devaraj Das & Owen O'Malley via tomwhite) - 8. HADOOP-1179. Make Task Tracker close index file as soon as the read - is done when serving get-map-output requests. + 8. HADOOP-1179. Make Task Tracker close index file as soon as the read + is done when serving get-map-output requests. (Devaraj Das via tomwhite) @@ -14149,14 +14146,14 @@ Release 0.12.0 - 2007-03-02 13. HADOOP-923. In HDFS NameNode, move replication computation to a separate thread, to improve heartbeat processing time. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 14. HADOOP-476. Rewrite contrib/streaming command-line processing, improving parameter validation. 
(Sanjay Dahiya via cutting) 15. HADOOP-973. Improve error messages in Namenode. This should help to track down a problem that was appearing as a - NullPointerException. (Dhruba Borthakur via cutting) + NullPointerException. (Dhruba Borthakur via cutting) 16. HADOOP-649. Fix so that jobs with no tasks are not lost. (Thomas Friol via cutting) @@ -14171,7 +14168,7 @@ Release 0.12.0 - 2007-03-02 (Milind Bhandarkar via cutting) 20. HADOOP-943. Improve HDFS's fsck command to display the filename - for under-replicated blocks. (Dhruba Borthakur via cutting) + for under-replicated blocks. (Dhruba Borthakur via cutting) 21. HADOOP-333. Add validator for sort benchmark output. (Arun C Murthy via cutting) @@ -14197,7 +14194,7 @@ Release 0.12.0 - 2007-03-02 27. HADOOP-952. Create a public (shared) Hadoop EC2 AMI. The EC2 scripts now support launch of public AMIs. (tomwhite) - + 28. HADOOP-1025. Remove some obsolete code in ipc.Server. (cutting) 29. HADOOP-997. Implement S3 retry mechanism for failed block @@ -14268,7 +14265,7 @@ Release 0.12.0 - 2007-03-02 (Devaraj Das via cutting) 49. HADOOP-940. Improve HDFS's replication scheduling. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 50. HADOOP-1020. Fix a bug in Path resolution, and a with unit tests on Windows. (cutting) @@ -14302,7 +14299,7 @@ Release 0.12.0 - 2007-03-02 61. HADOOP-994. In HDFS, limit the number of blocks invalidated at once. Large lists were causing datenodes to timeout. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 62. HADOOP-432. Add a trash feature, disabled by default. When enabled, the FSShell 'rm' command will move things to a trash @@ -14313,7 +14310,7 @@ Release 0.12.0 - 2007-03-02 Release 0.11.2 - 2007-02-16 1. HADOOP-1009. Fix an infinite loop in the HDFS namenode. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 2. HADOOP-1014. Disable in-memory merging during shuffle, as this is causing data corruption. 
(Devaraj Das via cutting) @@ -14423,7 +14420,7 @@ Release 0.11.0 - 2007-02-02 27. [ intentionally blank ] 28. HADOOP-227. Add support for backup namenodes, which periodically - get snapshots of the namenode state. (Dhruba Borthakur via cutting) + get snapshots of the namenode state. (Dhruba Borthakur via cutting) 29. HADOOP-884. Add scripts in contrib/ec2 to facilitate running Hadoop on an Amazon's EC2 cluster. (Tom White via cutting) @@ -14547,10 +14544,10 @@ Release 0.10.0 - 2007-01-05 datanodes. (Mahadev Konar via cutting) 3. HADOOP-621. Change 'dfs -cat' to exit sooner when output has been - closed. (Dhruba Borthakur via cutting) + closed. (Dhruba Borthakur via cutting) 4. HADOOP-752. Rationalize some synchronization in DFS namenode. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 5. HADOOP-629. Fix RPC services to better check the protocol name and version. (omalley via cutting) @@ -14558,7 +14555,7 @@ Release 0.10.0 - 2007-01-05 6. HADOOP-774. Limit the number of invalid blocks returned with heartbeats by the namenode to datanodes. Transmitting and processing very large invalid block lists can tie up both the - namenode and datanode for too long. (Dhruba Borthakur via cutting) + namenode and datanode for too long. (Dhruba Borthakur via cutting) 7. HADOOP-738. Change 'dfs -get' command to not create CRC files by default, adding a -crc option to force their creation. @@ -14591,7 +14588,7 @@ Release 0.10.0 - 2007-01-05 information in the web interface. (Sanjay Dahiya via cutting) 16. HADOOP-764. Reduce memory allocations in namenode some. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 17. HADOOP-802. Update description of mapred.speculative.execution to mention reduces. (Nigel Daley via cutting) @@ -14605,7 +14602,7 @@ Release 0.10.0 - 2007-01-05 20. HADOOP-782. Fully remove killed tasks. (Arun C Murthy via cutting) 21. HADOOP-792. Fix 'dfs -mv' to return correct status. 
- (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 22. HADOOP-673. Give each task its own working directory again. (Mahadev Konar via cutting) @@ -14620,7 +14617,7 @@ Release 0.10.0 - 2007-01-05 (cutting) 24. HADOOP-720. Add an HDFS white paper to website. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 25. HADOOP-794. Fix a divide-by-zero exception when a job specifies zero map tasks. (omalley via cutting) @@ -14654,7 +14651,7 @@ Release 0.10.0 - 2007-01-05 33. HADOOP-829. Within HDFS, clearly separate three different representations for datanodes: one for RPCs, one for namenode-internal use, and one for namespace persistence. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 34. HADOOP-823. Fix problem starting datanode when not all configured data directories exist. (Bryan Pendleton via cutting) @@ -14665,7 +14662,7 @@ Release 0.10.0 - 2007-01-05 longer passed in several methods, input validation has changed, etc. (omalley via cutting) -36. HADOOP-814. Optimize locking in namenode. (Dhruba Borthakur via cutting) +36. HADOOP-814. Optimize locking in namenode. (Dhruba Borthakur via cutting) 37. HADOOP-738. Change 'fs -put' and 'fs -get' commands to accept standard input and output, respectively. Standard i/o is @@ -14776,7 +14773,7 @@ Release 0.9.0 - 2006-12-01 configured with a non-existent directory. (Sanjay Dahiya via cutting) 4. HADOOP-645. Fix a bug in contrib/streaming when -reducer is NONE. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 5. HADOOP-687. Fix a classpath bug in bin/hadoop that blocked the servers from starting. (Sameer Paranjpye via omalley) @@ -14807,7 +14804,7 @@ Release 0.9.0 - 2006-12-01 SequenceFile. (Devaraj Das via cutting) 14. HADOOP-688. Move DFS administrative commands to a separate - command named 'dfsadmin'. (Dhruba Borthakur via cutting) + command named 'dfsadmin'. (Dhruba Borthakur via cutting) 15. HADOOP-708. 
Fix test-libhdfs to return the correct status, so that failures will break the build. (Nigel Daley via cutting) @@ -14916,7 +14913,7 @@ Release 0.8.0 - 2006-11-03 1. HADOOP-477. Extend contrib/streaming to scan the PATH environment variables when resolving executable program names. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 2. HADOOP-583. In DFSClient, reduce the log level of re-connect attempts from 'info' to 'debug', so they are not normally shown. @@ -14936,11 +14933,11 @@ Release 0.8.0 - 2006-11-03 7. HADOOP-462. Improve command line parsing in DFSShell, so that incorrect numbers of arguments result in informative errors rather - than ArrayOutOfBoundsException. (Dhruba Borthakur via cutting) + than ArrayOutOfBoundsException. (Dhruba Borthakur via cutting) 8. HADOOP-561. Fix DFS so that one replica of each block is written locally, if possible. This was the intent, but there as a bug. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 9. HADOOP-610. Fix TaskTracker to survive more exceptions, keeping tasks from becoming lost. (omalley via cutting) @@ -14949,7 +14946,7 @@ Release 0.8.0 - 2006-11-03 stack dump, useful for debugging. (omalley via cutting) 11. HADOOP-554. Fix DFSShell to return -1 for errors. - (Dhruba Borthakur via cutting) + (Dhruba Borthakur via cutting) 12. HADOOP-626. Correct the documentation in the NNBench example code, and also remove a mistaken call there. @@ -15089,7 +15086,7 @@ Release 0.7.0 - 2006-10-06 1. HADOOP-243. Fix rounding in the display of task and job progress so that things are not shown to be 100% complete until they are in - fact finished. (omalley via cutting) + fact finished. (omalley via cutting) 2. HADOOP-438. Limit the length of absolute paths in DFS, since the file format used to store pathnames has some limitations. @@ -15717,7 +15714,7 @@ Release 0.3.1 - 2006-06-05 waiting for map outputs, so that they do not time out. (Mahadev Konar via cutting) - 4. HADOOP-245 and HADOOP-246. 
Improvements to record io package. + 4. HADOOP-245 and HADOOP-246. Improvements to record io package. (Mahadev Konar via cutting) 5. HADOOP-276. Add logging config files to jar file so that they're @@ -15921,7 +15918,7 @@ Release 0.2.0 - 2006-05-05 23. Fix HADOOP-162. Fix ConcurrentModificationException when releasing file locks. (omalley via cutting) -24. Fix HADOOP-132. Initial check-in of new Metrics API, including +24. Fix HADOOP-132. Initial check-in of new Metrics API, including implementations for writing metric data to a file and for sending it to Ganglia. (David Bowen via cutting) @@ -16040,7 +16037,7 @@ Release 0.1.1 - 2006-04-08 3. Fix HADOOP-117. Pathnames were mistakenly transposed in JobConf.getLocalFile() causing many mapred temporary files to not be removed. (Raghavendra Prabhu via cutting) - + 4. Fix HADOOP-116. Clean up job submission files when jobs complete. (cutting) diff --git a/hadoop-common-project/hadoop-common/src/main/java/org/apache/hadoop/metrics2/impl/MetricsSourceAdapter.java b/hadoop-common-project/hadoop-common/src/main/java/org/apache/hadoop/metrics2/impl/MetricsSourceAdapter.java index cae9c3d7b4d..cf11e6db14e 100644 --- a/hadoop-common-project/hadoop-common/src/main/java/org/apache/hadoop/metrics2/impl/MetricsSourceAdapter.java +++ b/hadoop-common-project/hadoop-common/src/main/java/org/apache/hadoop/metrics2/impl/MetricsSourceAdapter.java @@ -173,8 +173,9 @@ class MetricsSourceAdapter implements DynamicMBean { } synchronized(this) { - updateAttrCache(); - if (getAllMetrics) { + int oldCacheSize = attrCache.size(); + int newCacheSize = updateAttrCache(); + if (oldCacheSize < newCacheSize) { updateInfoCache(); } jmxCacheTS = Time.now(); diff --git a/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/metrics2/impl/TestMetricsSourceAdapter.java b/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/metrics2/impl/TestMetricsSourceAdapter.java index 22b594aecf7..724d449fccd 100644 --- 
a/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/metrics2/impl/TestMetricsSourceAdapter.java +++ b/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/metrics2/impl/TestMetricsSourceAdapter.java @@ -23,8 +23,6 @@ import static org.junit.Assert.*; import java.util.ArrayList; import java.util.List; -import org.apache.hadoop.metrics2.MetricsCollector; -import org.apache.hadoop.metrics2.MetricsRecordBuilder; import org.apache.hadoop.metrics2.MetricsSource; import org.apache.hadoop.metrics2.MetricsTag; import org.apache.hadoop.metrics2.annotation.Metric; @@ -33,59 +31,10 @@ import org.apache.hadoop.metrics2.lib.MetricsAnnotations; import org.apache.hadoop.metrics2.lib.MetricsRegistry; import org.apache.hadoop.metrics2.lib.MetricsSourceBuilder; import org.apache.hadoop.metrics2.lib.MutableCounterLong; -import static org.apache.hadoop.metrics2.lib.Interns.info; -import static org.junit.Assert.assertEquals; - import org.junit.Test; -import javax.management.MBeanAttributeInfo; -import javax.management.MBeanInfo; - public class TestMetricsSourceAdapter { - - @Test - public void testPurgeOldMetrics() throws Exception { - // create test source with a single metric counter of value 1 - PurgableSource source = new PurgableSource(); - MetricsSourceBuilder sb = MetricsAnnotations.newSourceBuilder(source); - final MetricsSource s = sb.build(); - - List injectedTags = new ArrayList(); - MetricsSourceAdapter sa = new MetricsSourceAdapter( - "tst", "tst", "testdesc", s, injectedTags, null, null, 1, false); - - MBeanInfo info = sa.getMBeanInfo(); - boolean sawIt = false; - for (MBeanAttributeInfo mBeanAttributeInfo : info.getAttributes()) { - sawIt |= mBeanAttributeInfo.getName().equals(source.lastKeyName); - }; - assertTrue("The last generated metric is not exported to jmx", sawIt); - - Thread.sleep(1000); // skip JMX cache TTL - - info = sa.getMBeanInfo(); - sawIt = false; - for (MBeanAttributeInfo mBeanAttributeInfo : info.getAttributes()) { - 
sawIt |= mBeanAttributeInfo.getName().equals(source.lastKeyName); - }; - assertTrue("The last generated metric is not exported to jmx", sawIt); - } - - //generate a new key per each call - class PurgableSource implements MetricsSource { - int nextKey = 0; - String lastKeyName = null; - @Override - public void getMetrics(MetricsCollector collector, boolean all) { - MetricsRecordBuilder rb = - collector.addRecord("purgablesource") - .setContext("test"); - lastKeyName = "key" + nextKey++; - rb.addGauge(info(lastKeyName, "desc"), 1); - } - } - @Test public void testGetMetricsAndJmx() throws Exception { // create test source with a single metric counter of value 0