From 8597e9cf356b0d8e17600a49efc4c4a0356ecb5d Mon Sep 17 00:00:00 2001 From: Patrick Wendell Date: Wed, 27 Aug 2014 15:55:59 -0700 Subject: BUILD: Updating CHANGES.txt for Spark 1.1 --- CHANGES.txt | 14470 ++++++++++++++++++++++++++++ dev/create-release/generate-changelist.py | 4 +- 2 files changed, 14472 insertions(+), 2 deletions(-) create mode 100644 CHANGES.txt diff --git a/CHANGES.txt b/CHANGES.txt new file mode 100644 index 0000000000..6efb022574 --- /dev/null +++ b/CHANGES.txt @@ -0,0 +1,14470 @@ +Spark Change Log +---------------- + +Release 1.1.0 + + Add line continuation for script to work w/ py2.7.5 + Matthew Farrellee + 2014-08-27 15:50:30 -0700 + Commit: d4cf7a0, github.com/apache/spark/pull/2139 + + [SPARK-3235][SQL] Ensure in-memory tables don't always broadcast. + Michael Armbrust + 2014-08-27 15:14:08 -0700 + Commit: 9a62cf3, github.com/apache/spark/pull/2147 + + [SPARK-3065][SQL] Add locale setting to fix results do not match for udf_unix_timestamp format "yyyy MMM dd h:mm:ss a" run with not "America/Los_Angeles" TimeZone in HiveCompatibilitySuite + luogankun + 2014-08-27 15:08:22 -0700 + Commit: 5ea260e, github.com/apache/spark/pull/1968 + + [SQL] [SPARK-3236] Reading Parquet tables from Metastore mangles location + Aaron Davidson + 2014-08-27 15:05:47 -0700 + Commit: 7711687, github.com/apache/spark/pull/2150 + + [SPARK-3252][SQL] Add missing condition for test + viirya + 2014-08-27 14:55:05 -0700 + Commit: b3d763b, github.com/apache/spark/pull/2159 + + [SPARK-3243] Don't use stale spark-driver.* system properties + Andrew Or + 2014-08-27 14:46:56 -0700 + Commit: c1ffa3e, github.com/apache/spark/pull/2154 + + Spark-3213 Fixes issue with spark-ec2 not detecting slaves created with "Launch More like this" + Vida Ha + 2014-08-27 14:26:06 -0700 + Commit: 3cb4e17, github.com/apache/spark/pull/2163 + + [SPARK-3138][SQL] sqlContext.parquetFile should be able to take a single file as parameter + chutium + 2014-08-27 13:13:04 -0700 + Commit: 90f8f3e, 
github.com/apache/spark/pull/2044 + + [SPARK-3197] [SQL] Reduce the Expression tree object creations for aggregation function (min/max) + Cheng Hao + 2014-08-27 12:50:47 -0700 + Commit: 4c7f082, github.com/apache/spark/pull/2113 + + [SPARK-3118][SQL]add "SHOW TBLPROPERTIES tblname;" and "SHOW COLUMNS (FROM|IN) table_name [(FROM|IN) db_name]" support + u0jing + 2014-08-27 12:47:14 -0700 + Commit: 19cda07, github.com/apache/spark/pull/2034 + + SPARK-3259 - User data should be given to the master + Allan Douglas R. de Oliveira + 2014-08-27 12:43:22 -0700 + Commit: 0c94a5b, github.com/apache/spark/pull/2162 + + [SPARK-2608][Core] Fixed command line option passing issue over Mesos via SPARK_EXECUTOR_OPTS + Cheng Lian + 2014-08-27 12:39:21 -0700 + Commit: 935bffe, github.com/apache/spark/pull/2161 + + [SPARK-3239] [PySpark] randomize the dirs for each process + Davies Liu + 2014-08-27 10:40:35 -0700 + Commit: 092121e, github.com/apache/spark/pull/2152 + + [SPARK-3170][CORE][BUG]:RDD info loss in "StorageTab" and "ExecutorTab" + uncleGen + 2014-08-27 10:32:13 -0700 + Commit: 8f8e2a4, github.com/apache/spark/pull/2131 + + [SPARK-3154][STREAMING] Make FlumePollingInputDStream shutdown cleaner. + Hari Shreedharan + 2014-08-27 02:39:02 -0700 + Commit: 1d468df, github.com/apache/spark/pull/2065 + + [SPARK-3227] [mllib] Added migration guide for v1.0 to v1.1 + Joseph K. 
Bradley + 2014-08-27 01:45:59 -0700 + Commit: 7286d57, github.com/apache/spark/pull/2146 + + [SPARK-2830][MLLIB] doc update for 1.1 + Xiangrui Meng + 2014-08-27 01:19:48 -0700 + Commit: 7401247, github.com/apache/spark/pull/2151 + + [SPARK-3237][SQL] Fix parquet filters with UDFs + Michael Armbrust + 2014-08-27 00:59:23 -0700 + Commit: ca01de1, github.com/apache/spark/pull/2153 + + [SPARK-3139] Made ContextCleaner to not block on shuffles + Tathagata Das + 2014-08-27 00:13:38 -0700 + Commit: 5cf1e44, github.com/apache/spark/pull/2143 + + HOTFIX: Minor typo in conf template + Patrick Wendell + 2014-08-26 23:40:50 -0700 + Commit: 6f82a4b + + [SPARK-3167] Handle special driver configs in Windows (Branch 1.1) + Andrew Or + 2014-08-26 23:06:11 -0700 + Commit: e7672f1, github.com/apache/spark/pull/2156 + + [SPARK-3224] FetchFailed reduce stages should only show up once in failed stages (in UI) + Reynold Xin , Kay Ousterhout + 2014-08-26 21:59:48 -0700 + Commit: 2381e90, github.com/apache/spark/pull/2127 + + Fix unclosed HTML tag in Yarn docs. + Josh Rosen + 2014-08-26 18:55:00 -0700 + Commit: 7726e56 + + [SPARK-3036][SPARK-3037][SQL] Add MapType/ArrayType containing null value support to Parquet. 
+ Takuya UESHIN + 2014-08-26 18:28:41 -0700 + Commit: 8b5af6f, github.com/apache/spark/pull/2032 + + [Docs] Run tests like in contributing guide + nchammas + 2014-08-26 17:50:04 -0700 + Commit: 0d97233, github.com/apache/spark/pull/2149 + + [SPARK-2964] [SQL] Remove duplicated code from spark-sql and start-thriftserver.sh + Cheng Lian , Kousuke Saruta + 2014-08-26 17:33:40 -0700 + Commit: c0e1f99, github.com/apache/spark/pull/1886 + + [SPARK-3194][SQL] Add AttributeSet to fix bugs with invalid comparisons of AttributeReferences + Michael Armbrust + 2014-08-26 16:29:14 -0700 + Commit: a308a16, github.com/apache/spark/pull/2109 + + [SPARK-2839][MLlib] Stats Toolkit documentation updated + Burak + 2014-08-26 15:18:42 -0700 + Commit: 2715eb7, github.com/apache/spark/pull/2130 + + [SPARK-3226][MLLIB] doc update for native libraries + Xiangrui Meng + 2014-08-26 15:12:27 -0700 + Commit: 5ff9000, github.com/apache/spark/pull/2128 + + [SPARK-3063][SQL] ExistingRdd should convert Map to catalyst Map. + Takuya UESHIN + 2014-08-26 15:04:08 -0700 + Commit: 5d981a4, github.com/apache/spark/pull/1963 + + [SPARK-2969][SQL] Make ScalaReflection be able to handle ArrayType.containsNull and MapType.valueContainsNull. 
+ Takuya UESHIN + 2014-08-26 13:22:55 -0700 + Commit: 35a5853, github.com/apache/spark/pull/1889 + + [SPARK-2871] [PySpark] add histgram() API + Davies Liu + 2014-08-26 13:04:30 -0700 + Commit: 83d2730, github.com/apache/spark/pull/2091 + + [SPARK-3131][SQL] Allow user to set parquet compression codec for writing ParquetFile in SQLContext + chutium + 2014-08-26 11:51:26 -0700 + Commit: 3a9d874, github.com/apache/spark/pull/2039 + + [SPARK-2886] Use more specific actor system name than "spark" + Andrew Or + 2014-08-25 23:36:09 -0700 + Commit: 0f947f1, github.com/apache/spark/pull/1810 + + [Spark-3222] [SQL] Cross join support in HiveQL + Daoyuan Wang , adrian-wang + 2014-08-25 22:56:35 -0700 + Commit: 48a0749, github.com/apache/spark/pull/2124 + + SPARK-2481: The environment variables SPARK_HISTORY_OPTS is covered in spark-env.sh + witgo , GuoQiang Li + 2014-08-25 19:22:27 -0700 + Commit: 4d6a0e9, github.com/apache/spark/pull/1341 + + [SPARK-3011][SQL] _temporary directory should be filtered out by sqlContext.parquetFile + Chia-Yung Su + 2014-08-25 18:20:19 -0700 + Commit: b5dc9b4, github.com/apache/spark/pull/1959 + + [SQL] logWarning should be logInfo in getResultSetSchema + wangfei + 2014-08-25 17:46:43 -0700 + Commit: 957b356, github.com/apache/spark/pull/1939 + + [SPARK-3058] [SQL] Support EXTENDED for EXPLAIN + Cheng Hao + 2014-08-25 17:43:56 -0700 + Commit: f8ac8ed, github.com/apache/spark/pull/1962 + + [SPARK-2929][SQL] Refactored Thrift server and CLI suites + Cheng Lian + 2014-08-25 16:29:59 -0700 + Commit: 292f28d, github.com/apache/spark/pull/1856 + + [SPARK-3204][SQL] MaxOf would be foldable if both left and right are foldable. 
+ Takuya UESHIN + 2014-08-25 16:27:00 -0700 + Commit: 19b01d6, github.com/apache/spark/pull/2116 + + Fixed a typo in docs/running-on-mesos.md + Cheng Lian + 2014-08-25 14:56:51 -0700 + Commit: 8d33a6d, github.com/apache/spark/pull/2119 + + [FIX] fix error message in sendMessageReliably + Xiangrui Meng + 2014-08-25 14:55:20 -0700 + Commit: d892062, github.com/apache/spark/pull/2120 + + SPARK-2798 [BUILD] Correct several small errors in Flume module pom.xml files + Sean Owen + 2014-08-25 13:29:07 -0700 + Commit: ff616fd, github.com/apache/spark/pull/1726 + + [SPARK-2495][MLLIB] make KMeans constructor public + Xiangrui Meng + 2014-08-25 12:30:02 -0700 + Commit: 69a17f1, github.com/apache/spark/pull/2112 + + [SPARK-2871] [PySpark] add zipWithIndex() and zipWithUniqueId() + Davies Liu + 2014-08-24 21:16:05 -0700 + Commit: b82da3d, github.com/apache/spark/pull/2092 + + [MLlib][SPARK-2997] Update SVD documentation to reflect roughly square + Reza Zadeh + 2014-08-24 17:35:54 -0700 + Commit: 749bddc, github.com/apache/spark/pull/2070 + + [SPARK-2841][MLlib] Documentation for feature transformations + DB Tsai + 2014-08-24 17:33:33 -0700 + Commit: a4db81a, github.com/apache/spark/pull/2068 + + [SPARK-3192] Some scripts have 2 space indentation but other scripts have 4 space indentation. + Kousuke Saruta + 2014-08-24 09:43:44 -0700 + Commit: ce14cd1, github.com/apache/spark/pull/2104 + + [SPARK-2967][SQL] Follow-up: Also copy hash expressions in sort based shuffle fix. + Michael Armbrust + 2014-08-23 16:21:08 -0700 + Commit: e23f0bc, github.com/apache/spark/pull/2072 + + [SPARK-2554][SQL] CountDistinct partial aggregation and object allocation improvements + Michael Armbrust , Gregory Owen + 2014-08-23 16:19:10 -0700 + Commit: 7112da8, github.com/apache/spark/pull/1935 + + [SQL] Make functionRegistry in HiveContext transient. 
+ Yin Huai + 2014-08-23 12:46:41 -0700 + Commit: 9309786, github.com/apache/spark/pull/2074 + + [SPARK-2963] REGRESSION - The description about how to build for using CLI and Thrift JDBC server is absent in proper document - + Kousuke Saruta + 2014-08-22 22:28:05 -0700 + Commit: 5689660, github.com/apache/spark/pull/2080 + + [SPARK-3169] Removed dependency on spark streaming test from spark flume sink + Tathagata Das + 2014-08-22 21:34:48 -0700 + Commit: cd73631, github.com/apache/spark/pull/2101 + + Revert "HOTFIX:Temporarily removing flume sink test in 1.1 branch" + Patrick Wendell + 2014-08-22 21:31:52 -0700 + Commit: 385c4f2 + + [SPARK-2840] [mllib] DecisionTree doc update (Java, Python examples) + Joseph K. Bradley + 2014-08-21 00:17:29 -0700 + Commit: 1e5d9cb, github.com/apache/spark/pull/2063 + + BUILD: Bump Hadoop versions in the release build. + Patrick Wendell + 2014-08-20 12:18:41 -0700 + Commit: da0a701 + + HOTFIX:Temporarily removing flume sink test in 1.1 branch + Patrick Wendell + 2014-08-20 22:24:22 -0700 + Commit: 1d5e84a + + [HOTFIX][STREAMING] Allow the JVM/Netty to decide which port to bind to in Flume Polling Tests. + Hari Shreedharan + 2014-08-17 19:50:31 -0700 + Commit: 4485665, github.com/apache/spark/pull/1820 + + [HOTFIX][Streaming] Handle port collisions in flume polling test + Andrew Or + 2014-08-06 16:34:53 -0700 + Commit: 3f91e9d, github.com/apache/spark/pull/1803 + + [SPARK-2843][MLLIB] add a section about regularization parameter in ALS + Xiangrui Meng + 2014-08-20 17:47:39 -0700 + Commit: eba399b, github.com/apache/spark/pull/2064 + + [SPARK-3143][MLLIB] add tf-idf user guide + Xiangrui Meng + 2014-08-20 17:41:36 -0700 + Commit: 1af68ca, github.com/apache/spark/pull/2061 + + [SPARK-3140] Clarify confusing PySpark exception message + Andrew Or + 2014-08-20 17:07:39 -0700 + Commit: f8bcb12, github.com/apache/spark/pull/2067 + + [SPARK-2298] Encode stage attempt in SparkListener & UI. 
+ Reynold Xin + 2014-08-20 15:37:27 -0700 + Commit: dc05282, github.com/apache/spark/pull/1545 + + [SPARK-2169] Don't copy appName / basePath everywhere. + Marcelo Vanzin + 2014-08-18 13:25:30 -0700 + Commit: 2c1683e, github.com/apache/spark/pull/1252 + + [SPARK-2846][SQL] Add configureInputJobPropertiesForStorageHandler to initialization of job conf + Alex Liu + 2014-08-20 16:14:06 -0700 + Commit: 64e136a, github.com/apache/spark/pull/1927 + + SPARK_LOGFILE and SPARK_ROOT_LOGGER no longer need in spark-daemon.sh + wangfei + 2014-08-20 16:00:46 -0700 + Commit: 5f72d7b, github.com/apache/spark/pull/2057 + + [SPARK-2967][SQL] Fix sort based shuffle for spark sql. + Michael Armbrust + 2014-08-20 15:51:14 -0700 + Commit: 311831d, github.com/apache/spark/pull/2066 + + [SPARK-2849] Handle driver configs separately in client mode + Andrew Or + 2014-08-20 15:01:47 -0700 + Commit: beb705a, github.com/apache/spark/pull/1845 + + [SPARK-3149] Connection establishment information is not enough. + Kousuke Saruta + 2014-08-20 14:04:39 -0700 + Commit: 25b01fd, github.com/apache/spark/pull/2060 + + [SPARK-3062] [SPARK-2970] [SQL] spark-sql script ends with IOException when EventLogging is enabled + Kousuke Saruta + 2014-08-20 13:26:11 -0700 + Commit: 5095851, github.com/apache/spark/pull/1970 + + [SPARK-3126][SPARK-3127][SQL] Fixed HiveThriftServer2Suite + Cheng Lian + 2014-08-20 12:57:39 -0700 + Commit: 99ca704, github.com/apache/spark/pull/2036 + + SPARK-3092 [SQL]: Always include the thriftserver when -Phive is enabled. + Patrick Wendell + 2014-08-20 12:13:31 -0700 + Commit: ca7322d, github.com/apache/spark/pull/2006 + + [SPARK-3054][STREAMING] Add unit tests for Spark Sink. 
+ Hari Shreedharan , Hari Shreedharan + 2014-08-20 04:09:54 -0700 + Commit: 9b29099, github.com/apache/spark/pull/1958 + + [SPARK-3141] [PySpark] fix sortByKey() with take() + Davies Liu + 2014-08-19 22:43:49 -0700 + Commit: 5b22ebf, github.com/apache/spark/pull/2045 + + [DOCS] Fixed wrong links + Ken Takagiwa + 2014-08-19 22:43:22 -0700 + Commit: f8c908e, github.com/apache/spark/pull/2042 + + [SPARK-2974] [SPARK-2975] Fix two bugs related to spark.local.dirs + Josh Rosen + 2014-08-19 22:42:50 -0700 + Commit: 5d1a878, github.com/apache/spark/pull/2002 + + [SPARK-3142][MLLIB] output shuffle data directly in Word2Vec + Xiangrui Meng + 2014-08-19 22:16:22 -0700 + Commit: a5bc9c6, github.com/apache/spark/pull/2049 + + [SPARK-3119] Re-implementation of TorrentBroadcast. + Reynold Xin + 2014-08-19 22:11:13 -0700 + Commit: 08c9973, github.com/apache/spark/pull/2030 + + [HOTFIX][Streaming][MLlib] use temp folder for checkpoint + Xiangrui Meng + 2014-08-19 22:05:29 -0700 + Commit: d5db95b, github.com/apache/spark/pull/2046 + + [SPARK-3130][MLLIB] detect negative values in naive Bayes + Xiangrui Meng + 2014-08-19 21:01:23 -0700 + Commit: 148e45b, github.com/apache/spark/pull/2038 + + [SQL] add note of use synchronizedMap in SQLConf + wangfei , scwf + 2014-08-19 19:37:02 -0700 + Commit: 607735c, github.com/apache/spark/pull/1996 + + [SPARK-3112][MLLIB] Add documentation and example for StreamingLR + freeman + 2014-08-19 18:07:42 -0700 + Commit: d75464d, github.com/apache/spark/pull/2047 + + [MLLIB] minor update to word2vec + Xiangrui Meng + 2014-08-19 17:41:37 -0700 + Commit: 023ed7c, github.com/apache/spark/pull/2043 + + [SPARK-2468] Netty based block server / client module + Reynold Xin + 2014-08-19 17:40:35 -0700 + Commit: 66b4c81, github.com/apache/spark/pull/1971 + + [SPARK-3136][MLLIB] Create Java-friendly methods in RandomRDDs + Xiangrui Meng + 2014-08-19 16:06:48 -0700 + Commit: d371c71, github.com/apache/spark/pull/2041 + + [SPARK-2790] [PySpark] fix zip with 
serializers which have different batch sizes. + Davies Liu + 2014-08-19 14:46:32 -0700 + Commit: 3540d4b, github.com/apache/spark/pull/1894 + + Move a bracket in validateSettings of SparkConf + hzw19900416 + 2014-08-19 14:04:49 -0700 + Commit: f6b4ab8, github.com/apache/spark/pull/2012 + + SPARK-2333 - spark_ec2 script should allow option for existing security group + Vida Ha + 2014-08-19 13:35:05 -0700 + Commit: c3952b0, github.com/apache/spark/pull/1899 + + [SPARK-3128][MLLIB] Use streaming test suite for StreamingLR + freeman + 2014-08-19 13:28:57 -0700 + Commit: 04a3208, github.com/apache/spark/pull/2037 + + [SPARK-3089] Fix meaningless error message in ConnectionManager + Kousuke Saruta + 2014-08-19 10:15:11 -0700 + Commit: 5d895ad, github.com/apache/spark/pull/2000 + + [SPARK-3072] YARN - Exit when reach max number failed executors + Thomas Graves + 2014-08-19 09:40:31 -0500 + Commit: 1418893, github.com/apache/spark/pull/2022 + + Fix typo in decision tree docs + Matt Forbes + 2014-08-18 21:43:32 -0700 + Commit: f3b0f34, github.com/apache/spark/pull/1837 + + [SPARK-3116] Remove the excessive lockings in TorrentBroadcast + Reynold Xin + 2014-08-18 20:51:41 -0700 + Commit: b6d8e66, github.com/apache/spark/pull/2028 + + [SPARK-3114] [PySpark] Fix Python UDFs in Spark SQL. + Josh Rosen , Davies Liu + 2014-08-18 20:42:19 -0700 + Commit: 3a03259, github.com/apache/spark/pull/2026. + + [SPARK-3108][MLLIB] add predictOnValues to StreamingLR and fix predictOn + Xiangrui Meng + 2014-08-18 18:20:54 -0700 + Commit: 7d069bf, github.com/apache/spark/pull/2023 + + [SPARK-2850] [SPARK-2626] [mllib] MLlib stats examples + small fixes + Joseph K. Bradley + 2014-08-18 18:01:39 -0700 + Commit: e3f89e9, github.com/apache/spark/pull/1878 + + [mllib] DecisionTree: treeAggregate + Python example bug fix + Joseph K. Bradley + 2014-08-18 14:40:05 -0700 + Commit: 98778ff, github.com/apache/spark/pull/2015 + + [SPARK-2718] [yarn] Handle quotes and other characters in user args. 
+ Marcelo Vanzin + 2014-08-18 14:10:10 -0700 + Commit: 25cabd7, github.com/apache/spark/pull/1724 + + [SPARK-3103] [PySpark] fix saveAsTextFile() with utf-8 + Davies Liu + 2014-08-18 13:58:35 -0700 + Commit: e083334, github.com/apache/spark/pull/2018 + + [SPARK-2406][SQL] Initial support for using ParquetTableScan to read HiveMetaStore tables. + Michael Armbrust , Yin Huai + 2014-08-18 13:17:10 -0700 + Commit: cc4015d, github.com/apache/spark/pull/1819 + + [SPARK-3091] [SQL] Add support for caching metadata on Parquet files + Matei Zaharia + 2014-08-18 11:00:10 -0700 + Commit: 2ae2857, github.com/apache/spark/pull/2005 + + SPARK-3025 [SQL]: Allow JDBC clients to set a fair scheduler pool + Patrick Wendell + 2014-08-18 10:52:20 -0700 + Commit: 496f62d, github.com/apache/spark/pull/1937 + + [SPARK-3085] [SQL] Use compact data structures in SQL joins + Matei Zaharia + 2014-08-18 10:45:24 -0700 + Commit: 4da76fc, github.com/apache/spark/pull/1993 + + [SPARK-3084] [SQL] Collect broadcasted tables in parallel in joins + Matei Zaharia + 2014-08-18 10:05:52 -0700 + Commit: 55e9dd6, github.com/apache/spark/pull/1990 + + SPARK-3096: Include parquet hive serde by default in build + Patrick Wendell + 2014-08-18 10:00:46 -0700 + Commit: ec0b91e, github.com/apache/spark/pull/2009 + + [SPARK-2862] histogram method fails on some choices of bucketCount + Chandan Kumar + 2014-08-18 09:52:25 -0700 + Commit: 12f16ba, github.com/apache/spark/pull/1787 + + [MLlib] Remove transform(dataset: RDD[String]) from Word2Vec public API + Liquan Pei + 2014-08-18 01:15:45 -0700 + Commit: e0bc333, github.com/apache/spark/pull/2010 + + [SPARK-2842][MLlib]Word2Vec documentation + Liquan Pei + 2014-08-17 23:30:47 -0700 + Commit: 518258f, github.com/apache/spark/pull/2003 + + [SPARK-3097][MLlib] Word2Vec performance improvement + Liquan Pei + 2014-08-17 23:29:44 -0700 + Commit: 708cde9, github.com/apache/spark/pull/1932 + + SPARK-2900. 
aggregate inputBytes per stage + Sandy Ryza + 2014-08-17 22:39:06 -0700 + Commit: 0506539, github.com/apache/spark/pull/1826 + + SPARK-2884: Create binary builds in parallel with release script. + Patrick Wendell + 2014-08-17 22:29:58 -0700 + Commit: a5ae720 + + [SPARK-3087][MLLIB] fix col indexing bug in chi-square and add a check for number of distinct values + Xiangrui Meng + 2014-08-17 20:53:18 -0700 + Commit: 8438daf, github.com/apache/spark/pull/1997 + + [SPARK-1981] updated streaming-kinesis.md + Chris Fregly + 2014-08-17 19:33:15 -0700 + Commit: 8263567, github.com/apache/spark/pull/1757 + + [SQL] Improve debug logging and toStrings. + Michael Armbrust + 2014-08-17 19:00:38 -0700 + Commit: 4f776df, github.com/apache/spark/pull/2004 + + Revert "[SPARK-2970] [SQL] spark-sql script ends with IOException when EventLogging is enabled" + Michael Armbrust + 2014-08-17 18:10:45 -0700 + Commit: c6a0091, github.com/apache/spark/pull/2007 + + SPARK-2881: Upgrade to Snappy 1.0.5.3 to avoid SPARK-2881. + Patrick Wendell + 2014-08-17 15:48:39 -0700 + Commit: d411f41, github.com/apache/spark/pull/1999 + + [SPARK-3042] [mllib] DecisionTree Filter top-down instead of bottom-up + Joseph K. 
Bradley + 2014-08-16 23:53:14 -0700 + Commit: 91af120, github.com/apache/spark/pull/1975 + + [SPARK-3077][MLLIB] fix some chisq-test + Xiangrui Meng + 2014-08-16 21:16:27 -0700 + Commit: 413a329, github.com/apache/spark/pull/1982 + + In the stop method of ConnectionManager to cancel the ackTimeoutMonitor + GuoQiang Li + 2014-08-16 20:05:55 -0700 + Commit: f02e327, github.com/apache/spark/pull/1989 + + [SPARK-1065] [PySpark] improve supporting for large broadcast + Davies Liu + 2014-08-16 16:59:34 -0700 + Commit: 5dd571c, github.com/apache/spark/pull/1912 + + [SPARK-3035] Wrong example with SparkContext.addFile + iAmGhost + 2014-08-16 16:48:38 -0700 + Commit: 721f2fd, github.com/apache/spark/pull/1942 + + [SPARK-3081][MLLIB] rename RandomRDDGenerators to RandomRDDs + Xiangrui Meng + 2014-08-16 15:14:43 -0700 + Commit: a12d3ae, github.com/apache/spark/pull/1979 + + [SPARK-3048][MLLIB] add LabeledPoint.parse and remove loadStreamingLabeledPoints + Xiangrui Meng + 2014-08-16 15:13:34 -0700 + Commit: 0b354be, github.com/apache/spark/pull/1952 + + [SPARK-2677] BasicBlockFetchIterator#next can wait forever + Kousuke Saruta + 2014-08-16 14:15:58 -0700 + Commit: bd3ce2f, github.com/apache/spark/pull/1632 + + [SQL] Using safe floating-point numbers in doctest + Cheng Lian + 2014-08-16 11:26:51 -0700 + Commit: 8c79574, github.com/apache/spark/pull/1925 + + [SPARK-2977] Ensure ShuffleManager is created before ShuffleBlockManager + Josh Rosen + 2014-08-16 00:04:55 -0700 + Commit: 0e0ec2e, github.com/apache/spark/pull/1976 + + [SPARK-3045] Make Serializer interface Java friendly + Reynold Xin + 2014-08-15 23:12:34 -0700 + Commit: fcf30cd, github.com/apache/spark/pull/1948 + + [SPARK-3015] Block on cleaning tasks to prevent Akka timeouts + Andrew Or + 2014-08-15 22:55:32 -0700 + Commit: 2541537, github.com/apache/spark/pull/1931 + + [SPARK-3001][MLLIB] Improve Spearman's correlation + Xiangrui Meng + 2014-08-15 21:07:55 -0700 + Commit: ce06d7f, github.com/apache/spark/pull/1917 + 
+ [SPARK-3078][MLLIB] Make LRWithLBFGS API consistent with others + Xiangrui Meng + 2014-08-15 21:04:29 -0700 + Commit: c085011, github.com/apache/spark/pull/1973 + + [SPARK-3046] use executor's class loader as the default serializer classloader + Reynold Xin + 2014-08-15 17:04:15 -0700 + Commit: 077213b, github.com/apache/spark/pull/1972 + + [SPARK-3022] [SPARK-3041] [mllib] Call findBins once per level + unordered feature bug fix + Joseph K. Bradley + 2014-08-15 14:50:10 -0700 + Commit: 407ea9f, github.com/apache/spark/pull/1950 + + SPARK-3028. sparkEventToJson should support SparkListenerExecutorMetrics... + Sandy Ryza + 2014-08-15 11:35:08 -0700 + Commit: 63376a0, github.com/apache/spark/pull/1961 + + Revert "[SPARK-2468] Netty based block server / client module" + Patrick Wendell + 2014-08-15 09:01:35 -0700 + Commit: b066af4 + + [SPARK-2924] remove default args to overloaded methods + Anand Avati + 2014-08-15 08:53:52 -0700 + Commit: debb3e3, github.com/apache/spark/pull/1704 + + [SPARK-2468] Netty based block server / client module + Reynold Xin + 2014-08-14 19:01:33 -0700 + Commit: 3f23d2a, github.com/apache/spark/pull/1907 + + [SPARK-2936] Migrate Netty network module from Java to Scala + Reynold Xin + 2014-08-10 20:36:54 -0700 + Commit: d3cce58, github.com/apache/spark/pull/1865 + + [SPARK-2736] PySpark converter and example script for reading Avro files + Kan Zhang + 2014-08-14 19:03:51 -0700 + Commit: 72e730e, github.com/apache/spark/pull/1916 + + [SPARK-3027] TaskContext: tighten visibility and provide Java friendly callback API + Reynold Xin + 2014-08-14 18:37:02 -0700 + Commit: f99e4fc, github.com/apache/spark/pull/1938 + + Make dev/mima runnable on Mac OS X. + Reynold Xin + 2014-08-14 16:27:11 -0700 + Commit: 475a35b, github.com/apache/spark/pull/1953 + + SPARK-3009: Reverted readObject method in ApplicationInfo so that Applic... 
+ Jacek Lewandowski + 2014-08-14 15:01:39 -0700 + Commit: f5d9176, github.com/apache/spark/pull/1947 + + Revert [SPARK-3011][SQL] _temporary directory should be filtered out by sqlContext.parquetFile + Michael Armbrust + 2014-08-14 13:00:21 -0700 + Commit: c39a3f3, github.com/apache/spark/pull/1949 + + [SPARK-2979][MLlib] Improve the convergence rate by minimizing the condition number + DB Tsai + 2014-08-14 11:56:13 -0700 + Commit: dc8ef93, github.com/apache/spark/pull/1897 + + Minor cleanup of metrics.Source + Reynold Xin + 2014-08-14 11:22:41 -0700 + Commit: a3dc54f, github.com/apache/spark/pull/1943 + + [SPARK-2925] [sql]fix spark-sql and start-thriftserver shell bugs when set --driver-java-options + wangfei , wangfei + 2014-08-14 10:55:51 -0700 + Commit: df25acd, github.com/apache/spark/pull/1851 + + [SQL] Python JsonRDD UTF8 Encoding Fix + Ahir Reddy + 2014-08-14 10:48:52 -0700 + Commit: 850abaa, github.com/apache/spark/pull/1914 + + [SPARK-2927][SQL] Add a conf to configure if we always read Binary columns stored in Parquet as String columns + Yin Huai + 2014-08-14 10:46:33 -0700 + Commit: de501e1, github.com/apache/spark/pull/1855 + + [SPARK-3011][SQL] _temporary directory should be filtered out by sqlContext.parquetFile + Chia-Yung Su + 2014-08-14 10:43:08 -0700 + Commit: 221c84e, github.com/apache/spark/pull/1924 + + SPARK-2893: Do not swallow Exceptions when running a custom kryo registrator + Graham Dennis + 2014-08-14 02:24:18 -0700 + Commit: af809de, github.com/apache/spark/pull/1827 + + [SPARK-3029] Disable local execution of Spark jobs by default + Aaron Davidson + 2014-08-14 01:37:38 -0700 + Commit: 0cb2b82, github.com/apache/spark/pull/1321 + + [SPARK-2995][MLLIB] add ALS.setIntermediateRDDStorageLevel + Xiangrui Meng + 2014-08-13 23:53:44 -0700 + Commit: 1baf06f, github.com/apache/spark/pull/1913 + + [Docs] Add missing tags (minor) + Andrew Or + 2014-08-13 23:24:23 -0700 + Commit: bf7c6e1, github.com/apache/spark/pull/1936 + + [SPARK-3006] Failed 
to execute spark-shell in Windows OS + Masayoshi TSUZUKI + 2014-08-13 22:17:07 -0700 + Commit: dcd99c3, github.com/apache/spark/pull/1918 + + SPARK-3020: Print completed indices rather than tasks in web UI + Patrick Wendell + 2014-08-13 18:08:38 -0700 + Commit: c6cb55a, github.com/apache/spark/pull/1933 + + [SPARK-2986] [SQL] fixed: setting properties does not effect + guowei + 2014-08-13 17:45:24 -0700 + Commit: a8d2649, github.com/apache/spark/pull/1904 + + [SPARK-2970] [SQL] spark-sql script ends with IOException when EventLogging is enabled + Kousuke Saruta + 2014-08-13 17:42:38 -0700 + Commit: b5b632c, github.com/apache/spark/pull/1891 + + [SPARK-2935][SQL]Fix parquet predicate push down bug + Michael Armbrust + 2014-08-13 17:40:59 -0700 + Commit: e8e7f17, github.com/apache/spark/pull/1863 + + [SPARK-2650][SQL] More precise initial buffer size estimation for in-memory column buffer + Cheng Lian + 2014-08-13 17:37:55 -0700 + Commit: ee7d2cc, github.com/apache/spark/pull/1901 + + [SPARK-2994][SQL] Support for udfs that take complex types + Michael Armbrust + 2014-08-13 17:35:38 -0700 + Commit: 71b8408, github.com/apache/spark/pull/1915 + + [SPARK-2817] [SQL] add "show create table" support + tianyi , tianyi , tianyi + 2014-08-13 16:50:02 -0700 + Commit: 0fb1198, github.com/apache/spark/pull/1760 + + [SPARK-3004][SQL] Added null checking when retrieving row set + Cheng Lian + 2014-08-13 16:27:50 -0700 + Commit: 8732375, github.com/apache/spark/pull/1920 + + [MLLIB] use Iterator.fill instead of Array.fill + Xiangrui Meng + 2014-08-13 16:20:49 -0700 + Commit: e63bf87, github.com/apache/spark/pull/1930 + + [SPARK-2983] [PySpark] improve performance of sortByKey() + Davies Liu + 2014-08-13 14:57:12 -0700 + Commit: a7bc21c, github.com/apache/spark/pull/1898 + + [SPARK-3013] [SQL] [PySpark] convert array into list + Davies Liu + 2014-08-13 14:56:11 -0700 + Commit: 9936020, github.com/apache/spark/pull/1928 + + [SPARK-2963] [SQL] There no documentation about building to 
use HiveServer and CLI for SparkSQL + Kousuke Saruta + 2014-08-13 14:42:57 -0700 + Commit: 78f2f99, github.com/apache/spark/pull/1885 + + [SPARK-2993] [MLLib] colStats (wrapper around MultivariateStatisticalSummary) in Statistics + Doris Xin + 2014-08-12 23:47:42 -0700 + Commit: 5ebeb3f, github.com/apache/spark/pull/1911 + + [SPARK-1777 (partial)] bugfix: make size of requested memory correctly + Zhang, Liye + 2014-08-12 23:43:36 -0700 + Commit: ec5e2b0, github.com/apache/spark/pull/1892 + + Use transferTo when copy merge files in ExternalSorter + Raymond Liu + 2014-08-12 23:19:35 -0700 + Commit: be674b3, github.com/apache/spark/pull/1884 + + [SPARK-2953] Allow using short names for io compression codecs + Reynold Xin + 2014-08-12 22:50:29 -0700 + Commit: 837bf60, github.com/apache/spark/pull/1873 + + SPARK-2830 [MLlib]: re-organize mllib documentation + Ameet Talwalkar + 2014-08-12 17:15:21 -0700 + Commit: cffd9bb, github.com/apache/spark/pull/1908 + + fix flaky tests + Davies Liu + 2014-08-12 16:26:01 -0700 + Commit: b5f8083, github.com/apache/spark/pull/1910 + + [MLlib] Correctly set vectorSize and alpha + Liquan Pei + 2014-08-12 00:28:00 -0700 + Commit: 2a8117a, github.com/apache/spark/pull/1900 + + [SPARK-2923][MLLIB] Implement some basic BLAS routines + Xiangrui Meng + 2014-08-11 22:33:45 -0700 + Commit: 872c170, github.com/apache/spark/pull/1849 + + [SQL] [SPARK-2826] Reduce the memory copy while building the hashmap for HashOuterJoin + Cheng Hao + 2014-08-11 20:45:14 -0700 + Commit: f66f260, github.com/apache/spark/pull/1765 + + [SPARK-2650][SQL] Build column buffers in smaller batches + Michael Armbrust + 2014-08-11 20:21:56 -0700 + Commit: 779d1eb, github.com/apache/spark/pull/1880 + + [SPARK-2968][SQL] Fix nullabilities of Explode. + Takuya UESHIN + 2014-08-11 20:18:03 -0700 + Commit: 54b387f, github.com/apache/spark/pull/1888 + + [SPARK-2965][SQL] Fix HashOuterJoin output nullabilities. 
+ Takuya UESHIN + 2014-08-11 20:15:01 -0700 + Commit: dcbf079, github.com/apache/spark/pull/1887 + + [SQL] A tiny refactoring in HiveContext#analyze + Yin Huai + 2014-08-11 20:11:29 -0700 + Commit: fd8173f, github.com/apache/spark/pull/1881 + + [sql]use SparkSQLEnv.stop() in ShutdownHook + wangfei + 2014-08-11 20:10:13 -0700 + Commit: 6d0af52, github.com/apache/spark/pull/1852 + + [SPARK-2590][SQL] Added option to handle incremental collection, disabled by default + Cheng Lian + 2014-08-11 20:08:06 -0700 + Commit: cf2f807, github.com/apache/spark/pull/1853 + + [SPARK-2844][SQL] Correctly set JVM HiveContext if it is passed into Python HiveContext constructor + Ahir Reddy + 2014-08-11 20:06:06 -0700 + Commit: 8cb4e5b, github.com/apache/spark/pull/1768 + + [SPARK-2934][MLlib] Adding LogisticRegressionWithLBFGS Interface + DB Tsai + 2014-08-11 19:49:29 -0700 + Commit: 8f6e2e9, github.com/apache/spark/pull/1862 + + [SPARK-2515][mllib] Chi Squared test + Doris Xin + 2014-08-11 19:22:14 -0700 + Commit: 7e31f7c, github.com/apache/spark/pull/1733 + + [SPARK-2931] In TaskSetManager, reset currentLocalityIndex after recomputing locality levels + Josh Rosen + 2014-08-11 19:15:01 -0700 + Commit: 6c64d57, github.com/apache/spark/pull/1896 + + [SPARK-2952] Enable logging actor messages at DEBUG level + Reynold Xin + 2014-08-11 15:25:21 -0700 + Commit: 6ec1374, github.com/apache/spark/pull/1870 + + [PySpark] [SPARK-2954] [SPARK-2948] [SPARK-2910] [SPARK-2101] Python 2.6 Fixes + Josh Rosen + 2014-08-11 11:54:09 -0700 + Commit: 09b8a3c, github.com/apache/spark/pull/1868 
+ + [SPARK-2937] Separate out sampleByKeyExact as its own API in PairRDDFunction + Doris Xin , Xiangrui Meng + 2014-08-10 16:31:07 -0700 + Commit: 3def842, github.com/apache/spark/pull/1866 + + [SPARK-2898] [PySpark] fix bugs in daemon.py + Davies Liu + 2014-08-10 13:00:38 -0700 + Commit: 92daffe, github.com/apache/spark/pull/1842 + + Remove extra semicolon in Task.scala + GuoQiang Li + 2014-08-10 12:12:22 -0700 + Commit: bb23b11, github.com/apache/spark/pull/1876 + + Turn UpdateBlockInfo into case class. + Reynold Xin + 2014-08-09 23:06:54 -0700 + Commit: 076ddda, github.com/apache/spark/pull/1872 + + Updated Spark SQL README to include the hive-thriftserver module + Reynold Xin + 2014-08-09 22:05:36 -0700 + Commit: e8f8e5f, github.com/apache/spark/pull/1867 + + [SPARK-2894] spark-shell doesn't accept flags + Kousuke Saruta , Cheng Lian + 2014-08-09 21:10:43 -0700 + Commit: ba223b8, github.com/apache/spark/pull/1715 + + [SPARK-1766] sorted functions to meet pedantic requirements + Chris Cope + 2014-08-09 20:58:56 -0700 + Commit: 4a7f3ef, github.com/apache/spark/pull/1859 + + [SPARK-2861] Fix Doc comment of histogram method + Chandan Kumar + 2014-08-09 00:45:54 -0700 + Commit: 71fcd2e, github.com/apache/spark/pull/1786 + + [SPARK-2635] Fix race condition at SchedulerBackend.isReady in standalone mode + li-zhihui , Li Zhihui + 2014-08-08 22:52:56 -0700 + Commit: 3311da2, github.com/apache/spark/pull/1525 + + [SPARK-2897][SPARK-2920]TorrentBroadcast does use the serializer class specified in the spark option "spark.serializer" + GuoQiang Li + 2014-08-08 16:57:26 -0700 + Commit: dd11e4e, github.com/apache/spark/pull/1836 + + [SPARK-1997][MLLIB] update breeze to 0.9 + Xiangrui Meng + 2014-08-08 15:07:31 -0700 + Commit: 8fba6de, github.com/apache/spark/pull/1749 + + [SPARK-2700] [SQL] Hidden files (such as .impala_insert_staging) should be filtered out by sqlContext.parquetFile + chutium + 2014-08-08 13:31:08 -0700 + Commit: e264503, github.com/apache/spark/pull/1691 + 
+ [SPARK-2919] [SQL] Basic support for analyze command in HiveQl + Yin Huai + 2014-08-08 11:23:58 -0700 + Commit: daa090f, github.com/apache/spark/pull/1848 + + [SPARK-2877] [SQL] MetastoreRelation should use SparkClassLoader when creating the tableDesc + Yin Huai + 2014-08-08 11:15:16 -0700 + Commit: 8b0188b, github.com/apache/spark/pull/1806 + + [SPARK-2908] [SQL] JsonRDD.nullTypeToStringType does not convert all NullType to StringType + Yin Huai + 2014-08-08 11:10:11 -0700 + Commit: 544a909, github.com/apache/spark/pull/1840 + + [SPARK-2888] [SQL] Fix addColumnMetadataToConf in HiveTableScan + Yin Huai + 2014-08-08 11:01:51 -0700 + Commit: 3eb5dd0, github.com/apache/spark/pull/1817 + + [SPARK-2904] Remove non-used local variable in SparkSubmitArguments + Kousuke Saruta + 2014-08-07 18:53:15 -0700 + Commit: a54b5d9, github.com/apache/spark/pull/1834 + + SPARK-2565. Update ShuffleReadMetrics as blocks are fetched + Sandy Ryza + 2014-08-07 18:09:03 -0700 + Commit: aab7735, github.com/apache/spark/pull/1507 + + SPARK-2787: Make sort-based shuffle write files directly when there's no sorting/aggregation and # partitions is small + Matei Zaharia + 2014-08-07 18:04:49 -0700 + Commit: 0f2274f, github.com/apache/spark/pull/1799 + + SPARK-2899 Doc generation is back to working in new SBT Build. + Prashant Sharma + 2014-08-07 16:24:22 -0700 + Commit: 30369b8, github.com/apache/spark/pull/1830 + + SPARK-2905 Fixed path sbin => bin + Oleg Danilov + 2014-08-07 15:48:44 -0700 + Commit: c65c810, github.com/apache/spark/pull/1835 + + [SPARK-2852][MLLIB] Separate model from IDF/StandardScaler algorithms + Xiangrui Meng + 2014-08-07 11:28:12 -0700 + Commit: f705c1d, github.com/apache/spark/pull/1814 + + [mllib] DecisionTree Strategy parameter checks + Joseph K. 
Bradley + 2014-08-07 00:20:38 -0700 + Commit: c089429, github.com/apache/spark/pull/1821 + + SPARK-2879 part 2 [BUILD] Use HTTPS to access Maven Central and other repos + Sean Owen + 2014-08-07 00:04:18 -0700 + Commit: d6cd6fd0, github.com/apache/spark/pull/1828 + + [SPARK-2851] [mllib] DecisionTree Python consistency update + Joseph K. Bradley + 2014-08-06 22:58:59 -0700 + Commit: c9f0944, github.com/apache/spark/pull/1798 + + [SPARK-2887] fix bug of countApproxDistinct() when have more than one partition + Davies Liu + 2014-08-06 21:22:13 -0700 + Commit: cc8a7e9, github.com/apache/spark/pull/1812 + + Updating versions for Spark 1.1.0 + Patrick Wendell + 2014-08-06 19:11:39 -0700 + Commit: cf35b56 + + HOTFIX: Support custom Java 7 location + Patrick Wendell + 2014-08-06 18:45:03 -0700 + Commit: 53fa048 + + SPARK-2879 [BUILD] Use HTTPS to access Maven Central and other repos + Sean Owen + 2014-08-06 18:13:35 -0700 + Commit: 40284a9, github.com/apache/spark/pull/1805 + + [SPARK-2583] ConnectionManager error reporting + Kousuke Saruta , Josh Rosen + 2014-08-06 17:27:55 -0700 + Commit: 3f92ce4, github.com/apache/spark/pull/1758 + + SPARK-2882: Spark build now checks local maven cache for dependencies + Gregory Owen + 2014-08-06 16:52:00 -0700 + Commit: c2ae0b0, github.com/apache/spark/pull/1818 + + [PySpark] Add blanklines to Python docstrings so example code renders correctly + RJ Nowling + 2014-08-06 14:12:21 -0700 + Commit: a314e29, github.com/apache/spark/pull/1808 + + [SPARK-2852][MLLIB] API consistency for `mllib.feature` + Xiangrui Meng + 2014-08-06 14:07:51 -0700 + Commit: e654cfd, github.com/apache/spark/pull/1807 + + SPARK-2566. 
Update ShuffleWriteMetrics incrementally + Sandy Ryza + 2014-08-06 13:10:33 -0700 + Commit: a65c9ac, github.com/apache/spark/pull/1481 + + [SPARK-2627] [PySpark] have the build enforce PEP 8 automatically + Nicholas Chammas , nchammas + 2014-08-06 12:58:24 -0700 + Commit: 4c19614, github.com/apache/spark/pull/1744 + + [SPARK-2678][Core][SQL] A workaround for SPARK-2678 + Cheng Lian + 2014-08-06 12:28:35 -0700 + Commit: cf8e7fd, github.com/apache/spark/pull/1801 + + [SPARK-2875] [PySpark] [SQL] handle null in schemaRDD() + Davies Liu + 2014-08-06 11:08:12 -0700 + Commit: 27a8d4c, github.com/apache/spark/pull/1802 + + [SPARK-2157] Enable tight firewall rules for Spark + Andrew Or , Andrew Ash + 2014-08-06 00:07:40 -0700 + Commit: 31090e4, github.com/apache/spark/pull/1777 + + [SPARK-1022][Streaming][HOTFIX] Fixed zookeeper dependency of Kafka + Tathagata Das + 2014-08-05 23:41:34 -0700 + Commit: 5b4bc84, github.com/apache/spark/pull/1797 + + [MLlib] Use this.type as return type in k-means' builder pattern + DB Tsai + 2014-08-05 23:32:29 -0700 + Commit: aec217a, github.com/apache/spark/pull/1796 + + SPARK-2294: fix locality inversion bug in TaskManager + CodingCat + 2014-08-05 23:02:58 -0700 + Commit: 1da2fdf, github.com/apache/spark/pull/1313 + + [SQL] Fix logging warn -> debug + Michael Armbrust + 2014-08-05 22:30:32 -0700 + Commit: 0482055, github.com/apache/spark/pull/1800 + + [SQL] Tighten the visibility of various SQLConf methods and renamed setter/getters + Reynold Xin + 2014-08-05 22:29:19 -0700 + Commit: 4f0b4f4, github.com/apache/spark/pull/1794 + + [SPARK-2806] core - upgrade to json4s-jackson 3.2.10 + Anand Avati + 2014-08-05 21:59:10 -0700 + Commit: 6da8f41, github.com/apache/spark/pull/1702 + + [SPARK-2866][SQL] Support attributes in ORDER BY that aren't in SELECT + Michael Armbrust + 2014-08-05 20:55:02 -0700 + Commit: 936f61e, github.com/apache/spark/pull/1795 + + [SPARK-2854][SQL] Finalize _acceptable_types in pyspark.sql + Yin Huai + 2014-08-05 
18:56:10 -0700 + Commit: a10e1b0, github.com/apache/spark/pull/1793 + + [SPARK-2650][SQL] Try to partially fix SPARK-2650 by adjusting initial buffer size and reducing memory allocation + Cheng Lian + 2014-08-05 18:50:37 -0700 + Commit: 4233b02, github.com/apache/spark/pull/1769 + + [sql] rename project name in pom.xml of hive-thriftserver module + wangfei + 2014-08-05 18:30:02 -0700 + Commit: 152e36c, github.com/apache/spark/pull/1789 + + SPARK-2869 - Fix tiny bug in JdbcRdd for closing jdbc connection + Stephen Boesch , Stephen Boesch + 2014-08-05 18:18:08 -0700 + Commit: 58247a8, github.com/apache/spark/pull/1792 + + [SPARK-2550][MLLIB][APACHE SPARK] Support regularization and intercept in pyspark's linear methods + Michael Giannakopoulos + 2014-08-05 16:30:32 -0700 + Commit: 672904e, github.com/apache/spark/pull/1775 + + [SPARK-2503] Lower shuffle output buffer (spark.shuffle.file.buffer.kb) to 32KB. + Reynold Xin + 2014-08-05 16:24:50 -0700 + Commit: 0172277, github.com/apache/spark/pull/1781 + + [SPARK-2856] Decrease initial buffer size for Kryo to 64KB. + Reynold Xin + 2014-08-05 01:30:46 -0700 + Commit: 5081b0d, github.com/apache/spark/pull/1780 + + [SPARK-2864][MLLIB] fix random seed in word2vec; move model to local + Xiangrui Meng + 2014-08-05 16:22:41 -0700 + Commit: e77fa81, github.com/apache/spark/pull/1790 + + SPARK-1680: use configs for specifying environment variables on YARN + Thomas Graves + 2014-08-05 15:57:32 -0500 + Commit: 7b798e1, github.com/apache/spark/pull/1512 + + SPARK-2380: Support displaying accumulator values in the web UI + Patrick Wendell + 2014-08-05 13:08:23 -0700 + Commit: 46b6983, github.com/apache/spark/pull/1309 + + [SPARK-2859] Update url of Kryo project in related docs + Guancheng (G.C.) Chen + 2014-08-05 11:50:08 -0700 + Commit: 0f541ab, github.com/apache/spark/pull/1782 + + [SPARK-2860][SQL] Fix coercion of CASE WHEN. 
+ Michael Armbrust + 2014-08-05 11:17:50 -0700 + Commit: 388ab53, github.com/apache/spark/pull/1785 + + SPARK-1890 and SPARK-1891- add admin and modify acls + Thomas Graves + 2014-08-05 12:52:52 -0500 + Commit: e3fe657, github.com/apache/spark/pull/1196 + + SPARK-1528 - spark on yarn, add support for accessing remote HDFS + Thomas Graves + 2014-08-05 12:48:26 -0500 + Commit: 6c0c65f, github.com/apache/spark/pull/1159 + + [SPARK-1022][Streaming] Add Kafka real unit test + jerryshao + 2014-08-05 10:40:28 -0700 + Commit: b92a450, github.com/apache/spark/pull/1751 + + [SPARK-1779] Throw an exception if memory fractions are not between 0 and 1 + wangfei , wangfei + 2014-08-05 00:51:07 -0700 + Commit: 075ba67, github.com/apache/spark/pull/714 + + [SPARK-2857] Correct properties to set Master / Worker ports + Andrew Or + 2014-08-05 00:39:07 -0700 + Commit: 12f99cf, github.com/apache/spark/pull/1779 + + SPARK-2711. Create a ShuffleMemoryManager to track memory for all spilling collections + Matei Zaharia + 2014-08-04 23:41:03 -0700 + Commit: d13d253, github.com/apache/spark/pull/1707 + + SPARK-2685. Update ExternalAppendOnlyMap to avoid buffer.remove() + Matei Zaharia + 2014-08-04 23:27:53 -0700 + Commit: a092285, github.com/apache/spark/pull/1773 + + [SPARK-2323] Exception in accumulator update should not crash DAGScheduler & SparkContext + Reynold Xin + 2014-08-04 20:39:18 -0700 + Commit: 4ed7b5a, github.com/apache/spark/pull/1772 + + [SPARK-1687] [PySpark] fix unit tests related to pickable namedtuple + Davies Liu + 2014-08-04 15:54:52 -0700 + Commit: 2225d18, github.com/apache/spark/pull/1771 + + SPARK-2792. 
Fix reading too much or too little data from each stream in ExternalMap / Sorter + Matei Zaharia + 2014-08-04 12:59:18 -0700 + Commit: aa7a48e, github.com/apache/spark/pull/1722 + + [SPARK-1687] [PySpark] pickable namedtuple + Davies Liu + 2014-08-04 12:13:41 -0700 + Commit: bfd2f39, github.com/apache/spark/pull/1623 + + [MLlib] [SPARK-2510]Word2Vec: Distributed Representation of Words + Liquan Pei , Xiangrui Meng , Liquan Pei + 2014-08-03 23:55:58 -0700 + Commit: 3823f6d, github.com/apache/spark/pull/1719 + + SPARK-2272 [MLlib] Feature scaling which standardizes the range of independent variables or features of data + DB Tsai + 2014-08-03 21:39:21 -0700 + Commit: 9aa1459, github.com/apache/spark/pull/1207 + + Fix some bugs with spaces in directory name. + Sarah Gerweck + 2014-08-03 19:47:05 -0700 + Commit: 2152e24, github.com/apache/spark/pull/1756 + + [SPARK-2810] upgrade to scala-maven-plugin 3.2.0 + Anand Avati + 2014-08-03 17:47:49 -0700 + Commit: 4784d24, github.com/apache/spark/pull/1711 + + [SPARK-1740] [PySpark] kill the python worker + Davies Liu + 2014-08-03 15:52:00 -0700 + Commit: a4cdb77, github.com/apache/spark/pull/1643 + + [SPARK-2783][SQL] Basic support for analyze in HiveContext + Yin Huai + 2014-08-03 14:54:41 -0700 + Commit: 7c6afda, github.com/apache/spark/pull/1741 + + [SPARK-2814][SQL] HiveThriftServer2 throws NPE when executing native commands + Cheng Lian + 2014-08-03 12:34:46 -0700 + Commit: 6ffdcc6, github.com/apache/spark/pull/1753 + + [SPARK-2784][SQL] Deprecate hql() method in favor of a config option, 'spark.sql.dialect' + Michael Armbrust + 2014-08-03 12:28:29 -0700 + Commit: c5ed1de, github.com/apache/spark/pull/1746 + + [SPARK-2197] [mllib] Java DecisionTree bug fix and easy-of-use + Joseph K. Bradley + 2014-08-03 10:36:52 -0700 + Commit: eaa9355, github.com/apache/spark/pull/1740 + + SPARK-2246: Add user-data option to EC2 scripts + Allan Douglas R. 
de Oliveira + 2014-08-03 10:25:59 -0700 + Commit: 162fc95, github.com/apache/spark/pull/1186 + + SPARK-2712 - Add a small note to maven doc that mvn package must happen ... + Stephen Boesch + 2014-08-03 10:19:04 -0700 + Commit: 1992175, github.com/apache/spark/pull/1615 + + [Minor] Fixes on top of #1679 + Andrew Or + 2014-08-02 22:00:46 -0700 + Commit: fb2a207, github.com/apache/spark/pull/1736 + + SPARK-2414 [BUILD] Add LICENSE entry for jquery + Sean Owen + 2014-08-02 21:55:56 -0700 + Commit: c137928, github.com/apache/spark/pull/1748 + + SPARK-2602 [BUILD] Tests steal focus under Java 6 + Sean Owen + 2014-08-02 21:44:19 -0700 + Commit: 0d47bb6, github.com/apache/spark/pull/1747 + + [SPARK-2739][SQL] Rename registerAsTable to registerTempTable + Michael Armbrust + 2014-08-02 18:27:04 -0700 + Commit: 5b30e00, github.com/apache/spark/pull/1743 + + [SPARK-2797] [SQL] SchemaRDDs don't support unpersist() + Yin Huai + 2014-08-02 17:55:22 -0700 + Commit: 5ef8282, github.com/apache/spark/pull/1745 + + [SPARK-2729][SQL] Added test case for SPARK-2729 + Cheng Lian + 2014-08-02 17:12:49 -0700 + Commit: 460fad8, github.com/apache/spark/pull/1738 + + [SPARK-2785][SQL] Remove assertions that throw when users try unsupported Hive commands. + Michael Armbrust + 2014-08-02 16:48:07 -0700 + Commit: 4230df4, github.com/apache/spark/pull/1742 + + [SPARK-2097][SQL] UDF Support + Michael Armbrust + 2014-08-02 16:33:48 -0700 + Commit: 3b9f25f, github.com/apache/spark/pull/1063 + + SPARK-2804: Remove scalalogging-slf4j dependency + GuoQiang Li + 2014-08-02 13:55:28 -0700 + Commit: 7924d72, github.com/apache/spark/pull/also + + [SPARK-1981] Add AWS Kinesis streaming support + Chris Fregly + 2014-08-02 13:35:35 -0700 + Commit: bb0ac6d, github.com/apache/spark/pull/1434 + + [SQL] Set outputPartitioning of BroadcastHashJoin correctly. + Yin Huai + 2014-08-02 13:16:41 -0700 + Commit: 91de0dc, github.com/apache/spark/pull/1735 + + [SPARK-2478] [mllib] DecisionTree Python API + Joseph K. 
Bradley + 2014-08-02 13:07:17 -0700 + Commit: 8d6ac2b, github.com/apache/spark/pull/1727 + + [HOTFIX] Do not throw NPE if spark.test.home is not set + Andrew Or + 2014-08-02 12:11:50 -0700 + Commit: e221108, github.com/apache/spark/pull/1739 + + MAINTENANCE: Automated closing of pull requests. + Patrick Wendell + 2014-08-02 01:26:16 -0700 + Commit: 87738bf, github.com/apache/spark/pull/706 + + HOTFIX: Fix concurrency issue in FlumePollingStreamSuite. + Patrick Wendell + 2014-08-02 01:11:03 -0700 + Commit: 44460ba + + HOTFIX: Fixing test error in maven for flume-sink. + Patrick Wendell + 2014-08-02 00:57:47 -0700 + Commit: 25cad6a + + [SPARK-1812] sql/catalyst - Provide explicit type information + Anand Avati + 2014-08-02 00:48:17 -0700 + Commit: 08c095b, github.com/apache/spark/pull/1709 + + [SPARK-2454] Do not ship spark home to Workers + Andrew Or + 2014-08-02 00:45:38 -0700 + Commit: 148af60, github.com/apache/spark/pull/1734 + + [SPARK-2316] Avoid O(blocks) operations in listeners + Andrew Or + 2014-08-01 23:56:24 -0700 + Commit: d934801, github.com/apache/spark/pull/1679 + + Revert "[SPARK-1470][SPARK-1842] Use the scala-logging wrapper instead of the directly sfl4j api" + Patrick Wendell + 2014-08-01 23:55:30 -0700 + Commit: dab3796 + + [SPARK-1470][SPARK-1842] Use the scala-logging wrapper instead of the directly sfl4j api + GuoQiang Li + 2014-08-01 23:55:11 -0700 + Commit: adc8303, github.com/apache/spark/pull/1369 + + StatCounter on NumPy arrays [PYSPARK][SPARK-2012] + Jeremy Freeman + 2014-08-01 22:33:25 -0700 + Commit: 4bc3bb2, github.com/apache/spark/pull/1725 + + [SPARK-2801][MLlib]: DistributionGenerator renamed to RandomDataGenerator. RandomRDD is now of generic type + Burak + 2014-08-01 22:32:12 -0700 + Commit: fda4759, github.com/apache/spark/pull/1732 + + [SPARK-1580][MLLIB] Estimate ALS communication and computation costs. 
+ Tor Myklebust , Xiangrui Meng + 2014-08-01 21:25:02 -0700 + Commit: e25ec06, github.com/apache/spark/pull/493 + + [SPARK-2550][MLLIB][APACHE SPARK] Support regularization and intercept in pyspark's linear methods. + Michael Giannakopoulos + 2014-08-01 21:00:31 -0700 + Commit: c281189, github.com/apache/spark/pull/1624 + + Streaming mllib [SPARK-2438][MLLIB] + Jeremy Freeman , freeman + 2014-08-01 20:10:26 -0700 + Commit: f6a1899, github.com/apache/spark/pull/1361 + + [SPARK-2764] Simplify daemon.py process structure + Josh Rosen + 2014-08-01 19:38:21 -0700 + Commit: e8e0fd6, github.com/apache/spark/pull/1680 + + [SPARK-2800]: Exclude scalastyle-output.xml Apache RAT checks + GuoQiang Li + 2014-08-01 19:35:16 -0700 + Commit: a38d3c9, github.com/apache/spark/pull/1729 + + [SPARK-2116] Load spark-defaults.conf from SPARK_CONF_DIR if set + Albert Chu + 2014-08-01 19:00:38 -0700 + Commit: 0da07da, github.com/apache/spark/pull/1059 + + [SPARK-2212][SQL] Hash Outer Join (follow-up bug fix). + Yin Huai + 2014-08-01 18:52:01 -0700 + Commit: 3822f33, github.com/apache/spark/pull/1721 + + [SPARK-2010] [PySpark] [SQL] support nested structure in SchemaRDD + Davies Liu + 2014-08-01 18:47:41 -0700 + Commit: 880eabe, github.com/apache/spark/pull/1598 + + [SPARK-2796] [mllib] DecisionTree bug fix: ordered categorical features + Joseph K. 
Bradley + 2014-08-01 15:52:21 -0700 + Commit: 7058a53, github.com/apache/spark/pull/1720 + + [SPARK-2786][mllib] Python correlations + Doris Xin + 2014-08-01 15:02:17 -0700 + Commit: d88e695, github.com/apache/spark/pull/1713 + + SPARK-2791: Fix committing, reverting and state tracking in shuffle file consolidation + Aaron Davidson + 2014-08-01 13:57:19 -0700 + Commit: 78f2af5, github.com/apache/spark/pull/1678 + + [SPARK-2379] Fix the bug that streaming's receiver may fall into a dead loop + joyyoj + 2014-08-01 13:41:55 -0700 + Commit: b270309, github.com/apache/spark/pull/1694 + + SPARK-1612: Fix potential resource leaks + zsxwing + 2014-08-01 13:25:04 -0700 + Commit: f5d9bea, github.com/apache/spark/pull/535 + + [SPARK-2490] Change recursive visiting on RDD dependencies to iterative approach + Liang-Chi Hsieh + 2014-08-01 12:12:30 -0700 + Commit: baf9ce1, github.com/apache/spark/pull/1418 + + [SPARK-695] In DAGScheduler's getPreferredLocs, track set of visited partitions. + Aaron Staple + 2014-08-01 12:04:04 -0700 + Commit: eb5bdca, github.com/apache/spark/pull/1362 + + [SQL] Documentation: Explain cacheTable command + CrazyJvm + 2014-08-01 11:46:13 -0700 + Commit: c82fe47, github.com/apache/spark/pull/1681 + + [SPARK-2767] [SQL] SparkSQL CLI doesn't output error message if query failed. + Cheng Hao + 2014-08-01 11:42:05 -0700 + Commit: c0b47ba, github.com/apache/spark/pull/1686 + + [SPARK-2729] [SQL] Forgot to match Timestamp type in ColumnBuilder + chutium + 2014-08-01 11:31:44 -0700 + Commit: 580c701, github.com/apache/spark/pull/1636 + + [SQL][SPARK-2212]Hash Outer Join + Cheng Hao + 2014-08-01 11:27:12 -0700 + Commit: 4415722, github.com/apache/spark/pull/1147 + + [SPARK-2179][SQL] A minor refactoring Java data type APIs (2179 follow-up). + Yin Huai + 2014-08-01 11:14:53 -0700 + Commit: c41fdf0, github.com/apache/spark/pull/1712 + + SPARK-2099. Report progress while task is running. 
+ Sandy Ryza + 2014-08-01 11:08:39 -0700 + Commit: 8d338f6, github.com/apache/spark/pull/1056 + + [HOTFIX] downgrade breeze version to 0.7 + Xiangrui Meng + 2014-08-01 10:00:46 -0700 + Commit: 5328c0a, github.com/apache/spark/pull/1718 + + [SPARK-1997] update breeze to version 0.8.1 + witgo + 2014-08-01 07:47:44 -0700 + Commit: 0dacb1a, github.com/apache/spark/pull/940 + + SPARK-2768 [MLLIB] Add product, user recommend method to MatrixFactorizationModel + Sean Owen + 2014-08-01 07:32:53 -0700 + Commit: 82d209d, github.com/apache/spark/pull/1687 + + [SPARK-2103][Streaming] Change to ClassTag for KafkaInputDStream and fix reflection issue + jerryshao + 2014-08-01 04:32:46 -0700 + Commit: a32f0fb, github.com/apache/spark/pull/1508 + + [Spark 2557] fix LOCAL_N_REGEX in createTaskScheduler and make local-n and local-n-failures consistent + Ye Xianjin + 2014-08-01 00:34:39 -0700 + Commit: 284771e, github.com/apache/spark/pull/1464 + + SPARK-2134: Report metrics before application finishes + Rahul Singhal + 2014-08-01 00:33:15 -0700 + Commit: f1957e1, github.com/apache/spark/pull/1076 + + SPARK-983. Support external sorting in sortByKey() + Matei Zaharia + 2014-08-01 00:16:18 -0700 + Commit: 72e3369, github.com/apache/spark/pull/931 + + [SPARK-2670] FetchFailedException should be thrown when local fetch has failed + Kousuke Saruta + 2014-08-01 00:01:30 -0700 + Commit: 8ff4417, github.com/apache/spark/pull/1578 + + SPARK-2738. Remove redundant imports in BlockManagerSuite + Sandy Ryza + 2014-07-31 23:12:38 -0700 + Commit: cb9e7d5, github.com/apache/spark/pull/1642 + + SPARK-2632, SPARK-2576. Fixed by only importing what is necessary during class definition. 
+ Prashant Sharma , Yin Huai , Prashant Sharma + 2014-07-31 22:57:13 -0700 + Commit: 1499101, github.com/apache/spark/pull/1635 + + [SPARK-2702][Core] Upgrade Tachyon dependency to 0.5.0 + Haoyuan Li + 2014-07-31 22:53:42 -0700 + Commit: 2cdc3e5, github.com/apache/spark/pull/1651 + + [SPARK-2782][mllib] Bug fix for getRanks in SpearmanCorrelation + Doris Xin + 2014-07-31 21:23:35 -0700 + Commit: c475540, github.com/apache/spark/pull/1710 + + [SPARK-2777][MLLIB] change ALS factors storage level to MEMORY_AND_DISK + Xiangrui Meng + 2014-07-31 21:14:08 -0700 + Commit: b190083, github.com/apache/spark/pull/1700 + + SPARK-2766: ScalaReflectionSuite throw an IllegalArgumentException in JDK 6 + GuoQiang Li + 2014-07-31 21:06:57 -0700 + Commit: 9998efa, github.com/apache/spark/pull/1683 + + [SPARK-2779] [SQL] asInstanceOf[Map[...]] should use scala.collection.Map instead of scala.collection.immutable.Map + Yin Huai + 2014-07-31 21:02:11 -0700 + Commit: 9632719, github.com/apache/spark/pull/1705 + + [SPARK-2756] [mllib] Decision tree bug fixes + Joseph K. Bradley + 2014-07-31 20:51:48 -0700 + Commit: b124de5, github.com/apache/spark/pull/1673 + + [SPARK-2724] Python version of RandomRDDGenerators + Doris Xin + 2014-07-31 20:32:57 -0700 + Commit: d843014, github.com/apache/spark/pull/1628 + + [SPARK-2531 & SPARK-2436] [SQL] Optimize the BuildSide when planning BroadcastNestedLoopJoin. + Zongheng Yang + 2014-07-31 19:32:16 -0700 + Commit: 8f51491, github.com/apache/spark/pull/1448 + + SPARK-2282: Reuse Socket for sending accumulator updates to Pyspark + Aaron Davidson + 2014-07-31 15:31:53 -0700 + Commit: ef4ff00, github.com/apache/spark/pull/1503 + + SPARK-2740: allow user to specify ascending and numPartitions for sortBy... 
+ Rui Li + 2014-07-31 15:07:26 -0700 + Commit: 492a195, github.com/apache/spark/pull/1645 + + Docs: monitoring, streaming programming guide + kballou + 2014-07-31 14:58:52 -0700 + Commit: cc82050, github.com/apache/spark/pull/1662 + + Improvements to merge_spark_pr.py + Josh Rosen + 2014-07-31 14:35:09 -0700 + Commit: e021362, github.com/apache/spark/pull/1668 + + [SPARK-2523] [SQL] Hadoop table scan bug fixing (fix failing Jenkins maven test) + Yin Huai + 2014-07-31 13:05:24 -0700 + Commit: 49b3612, github.com/apache/spark/pull/1669 + + [SPARK-2511][MLLIB] add HashingTF and IDF + Xiangrui Meng + 2014-07-31 12:55:00 -0700 + Commit: dc0865b, github.com/apache/spark/pull/1671 + + SPARK-2646. log4j initialization not quite compatible with log4j 2.x + Sean Owen + 2014-07-31 12:26:36 -0700 + Commit: e5749a1, github.com/apache/spark/pull/1547 + + SPARK-2749 [BUILD] Part 2. Fix a follow-on scalastyle error + Sean Owen + 2014-07-31 12:18:40 -0700 + Commit: 4dbabb3, github.com/apache/spark/pull/1690 + + SPARK-2664. Deal with `--conf` options in spark-submit that relate to fl... + Sandy Ryza + 2014-07-31 11:51:20 -0700 + Commit: f68105d, github.com/apache/spark/pull/1665 + + SPARK-2028: Expose mapPartitionsWithInputSplit in HadoopRDD + Aaron Davidson + 2014-07-31 11:35:38 -0700 + Commit: f193312, github.com/apache/spark/pull/973 + + [SPARK-2397][SQL] Deprecate LocalHiveContext + Michael Armbrust + 2014-07-31 11:26:43 -0700 + Commit: 72cfb13, github.com/apache/spark/pull/1641 + + [SPARK-2743][SQL] Resolve original attributes in ParquetTableScan + Michael Armbrust + 2014-07-31 11:15:25 -0700 + Commit: 3072b96, github.com/apache/spark/pull/1647 + + [SPARK-2762] SparkILoop leaks memory in multi-repl configurations + Timothy Hunter + 2014-07-31 10:25:40 -0700 + Commit: 92ca910, github.com/apache/spark/pull/1674 + + automatically set master according to `spark.master` in `spark-defaults.... 
+ CrazyJvm + 2014-07-30 23:37:25 -0700 + Commit: 669e3f0, github.com/apache/spark/pull/1644 + + [SPARK-2497] Included checks for module symbols too. + Prashant Sharma + 2014-07-30 22:46:30 -0700 + Commit: 5a110da, github.com/apache/spark/pull/1463 + + [SPARK-2737] Add retag() method for changing RDDs' ClassTags. + Josh Rosen + 2014-07-30 22:40:57 -0700 + Commit: 4fb2593, github.com/apache/spark/pull/1639 + + [SPARK-2340] Resolve event logging and History Server paths properly + Andrew Or + 2014-07-30 21:57:32 -0700 + Commit: a7c305b, github.com/apache/spark/pull/1280 + + Required AM memory is "amMem", not "args.amMemory" + derek ma + 2014-07-30 21:37:59 -0700 + Commit: 118c1c4, github.com/apache/spark/pull/1494 + + [SPARK-2758] UnionRDD's UnionPartition should not reference parent RDDs + Reynold Xin + 2014-07-30 21:30:13 -0700 + Commit: 894d48f, github.com/apache/spark/pull/1675 + + SPARK-2045 Sort-based shuffle + Matei Zaharia + 2014-07-30 18:07:59 -0700 + Commit: e966284, github.com/apache/spark/pull/1499 + + Update DecisionTreeRunner.scala + strat0sphere + 2014-07-30 17:57:50 -0700 + Commit: da50176, github.com/apache/spark/pull/1676 + + SPARK-2341 [MLLIB] loadLibSVMFile doesn't handle regression datasets + Sean Owen + 2014-07-30 17:34:32 -0700 + Commit: e9b275b, github.com/apache/spark/pull/1663 + + [SPARK-2734][SQL] Remove tables from cache when DROP TABLE is run. + Michael Armbrust + 2014-07-30 17:30:51 -0700 + Commit: 88a519d, github.com/apache/spark/pull/1650 + + SPARK-2741 - Publish version of spark assembly which does not contain Hive + Brock Noland + 2014-07-30 17:04:30 -0700 + Commit: 2ac37db, github.com/apache/spark/pull/1667 + + SPARK-2749 [BUILD]. Spark SQL Java tests aren't compiling in Jenkins' Maven builds; missing junit:junit dep + Sean Owen + 2014-07-30 15:04:33 -0700 + Commit: 6ab96a6, github.com/apache/spark/pull/1660 + + Properly pass SBT_MAVEN_PROFILES into sbt. 
+ Reynold Xin + 2014-07-30 14:31:20 -0700 + Commit: 2f4b170 + + Set AMPLAB_JENKINS_BUILD_PROFILE. + Reynold Xin + 2014-07-30 14:08:24 -0700 + Commit: 1097327 + + Wrap JAR_DL in dev/check-license. + Reynold Xin + 2014-07-30 13:42:43 -0700 + Commit: 7c7ce54 + + [SPARK-2024] Add saveAsSequenceFile to PySpark + Kan Zhang + 2014-07-30 13:19:05 -0700 + Commit: 94d1f46, github.com/apache/spark/pull/1338 + + dev/check-license wrap folders in quotes. + Reynold Xin + 2014-07-30 13:17:14 -0700 + Commit: 437dc8c + + [SQL] Fix compiling of catalyst docs. + Michael Armbrust + 2014-07-30 13:11:09 -0700 + Commit: 2248891, github.com/apache/spark/pull/1653 + + More wrapping FWDIR in quotes. + Reynold Xin + 2014-07-30 13:04:20 -0700 + Commit: 0feb349 + + Wrap FWDIR in quotes in dev/check-license. + Reynold Xin + 2014-07-30 12:33:42 -0700 + Commit: 95cf203 + + Wrap FWDIR in quotes. + Reynold Xin + 2014-07-30 12:24:35 -0700 + Commit: f2eb84f + + [SPARK-2746] Set SBT_MAVEN_PROFILES only when it is not set explicitly by the user. 
+ Reynold Xin + 2014-07-30 11:45:24 -0700 + Commit: ff511ba, github.com/apache/spark/pull/1655 + + [SPARK-2544][MLLIB] Improve ALS algorithm resource usage + GuoQiang Li , witgo + 2014-07-30 11:00:11 -0700 + Commit: fc47bb6, github.com/apache/spark/pull/929 + + Avoid numerical instability + Naftali Harris + 2014-07-30 09:56:59 -0700 + Commit: e3d85b7, github.com/apache/spark/pull/1652 + + [SPARK-2747] git diff --dirstat can miss sql changes and not run Hive tests + Reynold Xin + 2014-07-30 09:28:53 -0700 + Commit: 3bc3f18, github.com/apache/spark/pull/1656 + + [SPARK-2521] Broadcast RDD object (instead of sending it along with every task) + Reynold Xin + 2014-07-30 09:27:43 -0700 + Commit: 774142f, github.com/apache/spark/pull/1498 + + SPARK-2748 [MLLIB] [GRAPHX] Loss of precision for small arguments to Math.exp, Math.log + Sean Owen + 2014-07-30 08:55:15 -0700 + Commit: ee07541, github.com/apache/spark/pull/1659 + + SPARK-2543: Allow user to set maximum Kryo buffer size + Koert Kuipers + 2014-07-30 00:18:59 -0700 + Commit: 7c5fc28, github.com/apache/spark/pull/735 + + [SPARK-2179][SQL] Public API for DataTypes and Schema + Yin Huai + 2014-07-30 00:15:31 -0700 + Commit: 7003c16, github.com/apache/spark/pull/1346 + + [SPARK-2260] Fix standalone-cluster mode, which was broken + Andrew Or + 2014-07-29 23:52:09 -0700 + Commit: 4ce92cc, github.com/apache/spark/pull/1538 + + [SQL] Handle null values in debug() + Michael Armbrust + 2014-07-29 22:42:54 -0700 + Commit: 077f633, github.com/apache/spark/pull/1646 + + [SPARK-2568] RangePartitioner should run only one job if data is balanced + Xiangrui Meng , Reynold Xin + 2014-07-29 22:16:20 -0700 + Commit: 2e6efca, github.com/apache/spark/pull/1562 + + [SPARK-2054][SQL] Code Generation for Expression Evaluation + Michael Armbrust + 2014-07-29 20:58:05 -0700 + Commit: 8446746, github.com/apache/spark/pull/993 + + [SPARK-2305] [PySpark] Update Py4J to version 0.8.2.1 + Josh Rosen + 2014-07-29 19:02:06 -0700 + Commit: 22649b6, 
github.com/apache/spark/pull/1626 + + [SPARK-2631][SQL] Use SQLConf to configure in-memory columnar caching + Michael Armbrust + 2014-07-29 18:20:51 -0700 + Commit: 86534d0, github.com/apache/spark/pull/1638 + + [SPARK-2716][SQL] Don't check resolved for having filters. + Michael Armbrust + 2014-07-29 18:14:20 -0700 + Commit: 39b8193, github.com/apache/spark/pull/1640 + + MAINTENANCE: Automated closing of pull requests. + Patrick Wendell + 2014-07-29 17:52:48 -0700 + Commit: 2c35666, github.com/apache/spark/pull/740 + + [SPARK-2393][SQL] Cost estimation optimization framework for Catalyst logical plans & sample usage. + Zongheng Yang + 2014-07-29 15:32:50 -0700 + Commit: c7db274, github.com/apache/spark/pull/1238 + + [SPARK-2082] stratified sampling in PairRDDFunctions that guarantees exact sample size + Doris Xin , Xiangrui Meng + 2014-07-29 12:49:44 -0700 + Commit: dc96536, github.com/apache/spark/pull/1025 + + [SPARK-2674] [SQL] [PySpark] support datetime type for SchemaRDD + Davies Liu + 2014-07-29 12:31:39 -0700 + Commit: f0d880e, github.com/apache/spark/pull/1601 + + [SPARK-2730][SQL] When retrieving a value from a Map, GetItem evaluates key twice + Yin Huai + 2014-07-29 12:23:34 -0700 + Commit: e364348, github.com/apache/spark/pull/1637 + + [SQL]change some test lists + Daoyuan + 2014-07-29 12:22:48 -0700 + Commit: 0c5c6a6, github.com/apache/spark/pull/1634 + + [STREAMING] SPARK-1729. Make Flume pull data from source, rather than the current pu... + Hari Shreedharan , Hari Shreedharan , Tathagata Das , harishreedharan + 2014-07-29 11:11:29 -0700 + Commit: 800ecff, github.com/apache/spark/pull/807 + + Minor indentation and comment typo fixes. + Aaron Staple + 2014-07-29 01:35:26 -0700 + Commit: fc4d057, github.com/apache/spark/pull/1630 + + [SPARK-2174][MLLIB] treeReduce and treeAggregate + Xiangrui Meng + 2014-07-29 01:16:41 -0700 + Commit: 20424da, github.com/apache/spark/pull/1110 + + [SPARK-2726] and [SPARK-2727] Remove SortOrder and do in-place sort. 
+ Reynold Xin + 2014-07-29 01:12:44 -0700 + Commit: 96ba04b, github.com/apache/spark/pull/1631 + + [SPARK-791] [PySpark] fix pickle itemgetter with cloudpickle + Davies Liu + 2014-07-29 01:02:18 -0700 + Commit: 92ef026, github.com/apache/spark/pull/1627 + + [SPARK-2580] [PySpark] keep silent in worker if JVM close the socket + Davies Liu + 2014-07-29 00:15:45 -0700 + Commit: ccd5ab5, github.com/apache/spark/pull/1625 + + Excess judgment + Yadong Qi + 2014-07-28 21:39:02 -0700 + Commit: 16ef4d1, github.com/apache/spark/pull/1629 + + Use commons-lang3 in SignalLogger rather than commons-lang + Aaron Davidson + 2014-07-28 13:37:44 -0700 + Commit: 39ab87b, github.com/apache/spark/pull/1621 + + [SPARK-2410][SQL] Merging Hive Thrift/JDBC server (with Maven profile fix) + Cheng Lian + 2014-07-28 12:07:30 -0700 + Commit: a7a9d14, github.com/apache/spark/pull/1620 + + [SPARK-2479][MLlib] Comparing floating-point numbers using relative error in UnitTests + DB Tsai + 2014-07-28 11:34:19 -0700 + Commit: 255b56f, github.com/apache/spark/pull/1425 + + [SPARK-2523] [SQL] Hadoop table scan bug fixing + Cheng Hao + 2014-07-28 10:59:53 -0700 + Commit: 2b8d89e, github.com/apache/spark/pull/1439 + + [SPARK-1550] [PySpark] Allow SparkContext creation after failed attempts + Josh Rosen + 2014-07-27 22:54:43 -0700 + Commit: a7d145e, github.com/apache/spark/pull/1606 + + SPARK-2651: Add maven scalastyle plugin + Rahul Singhal + 2014-07-27 18:50:32 -0700 + Commit: d7eac4c, github.com/apache/spark/pull/1550 + + Revert "[SPARK-2410][SQL] Merging Hive Thrift/JDBC server" + Patrick Wendell + 2014-07-27 18:46:58 -0700 + Commit: e5bbce9 + + [SPARK-2514] [mllib] Random RDD generator + Doris Xin + 2014-07-27 16:16:39 -0700 + Commit: 81fcdd2, github.com/apache/spark/pull/1520 + + [SPARK-1777] Prevent OOMs from single partitions + Andrew Or + 2014-07-27 16:08:16 -0700 + Commit: ecf30ee, github.com/apache/spark/pull/1165 + + [SPARK-2410][SQL] Merging Hive Thrift/JDBC server + Cheng Lian + 2014-07-27 
13:03:38 -0700 + Commit: f6ff2a6, github.com/apache/spark/pull/1600 + + [SPARK-2705][CORE] Fixed stage description in stage info page + Cheng Lian + 2014-07-27 12:35:21 -0700 + Commit: 2bbf235, github.com/apache/spark/pull/1524 + + SPARK-2684: Update ExternalAppendOnlyMap to take an iterator as input + Matei Zaharia + 2014-07-27 11:20:20 -0700 + Commit: 9857053, github.com/apache/spark/pull/1607 + + [SPARK-2679] [MLLib] Ser/De for Double + Doris Xin + 2014-07-27 07:21:07 -0700 + Commit: 3a69c72, github.com/apache/spark/pull/1581 + + [SPARK-2361][MLLIB] Use broadcast instead of serializing data directly into task closure + Xiangrui Meng + 2014-07-26 22:56:07 -0700 + Commit: aaf2b73, github.com/apache/spark/pull/1427 + + SPARK-2680: Lower spark.shuffle.memoryFraction to 0.2 by default + Matei Zaharia + 2014-07-26 22:44:17 -0700 + Commit: b547f69, github.com/apache/spark/pull/1593 + + [SPARK-2601] [PySpark] Fix Py4J error when transforming pickleFiles + Josh Rosen + 2014-07-26 17:37:05 -0700 + Commit: ba46bbe, github.com/apache/spark/pull/1605 + + [SPARK-2704] Name threads in ConnectionManager and mark them as daemon. 
+ Reynold Xin + 2014-07-26 15:00:32 -0700 + Commit: 1290164, github.com/apache/spark/pull/1604 + + [SPARK-2279] Added emptyRDD method to Java API + bpaulin + 2014-07-26 10:27:09 -0700 + Commit: c183b92, github.com/apache/spark/pull/1597 + + [SPARK-2652] [PySpark] Turning some default configs for PySpark + Davies Liu + 2014-07-26 01:07:08 -0700 + Commit: 75663b5, github.com/apache/spark/pull/1568 + + [SPARK-2696] Reduce default value of spark.serializer.objectStreamReset + Hossein + 2014-07-26 01:04:56 -0700 + Commit: 66f26a4, github.com/apache/spark/pull/1595 + + [SPARK-1458] [PySpark] Expose sc.version in Java and PySpark + Josh Rosen + 2014-07-26 00:54:05 -0700 + Commit: cf3e9fd, github.com/apache/spark/pull/1596 + + [SPARK-2659][SQL] Fix division semantics for hive + Michael Armbrust + 2014-07-25 19:17:49 -0700 + Commit: 8904791, github.com/apache/spark/pull/1557 + + Part of [SPARK-2456] Removed some HashMaps from DAGScheduler by storing information in Stage. + Reynold Xin + 2014-07-25 18:45:02 -0700 + Commit: 9d8666c, github.com/apache/spark/pull/1561 + + Revert "[SPARK-2410][SQL] Merging Hive Thrift/JDBC server" + Michael Armbrust + 2014-07-25 15:36:57 -0700 + Commit: afd757a, github.com/apache/spark/pull/1594 + + [SPARK-1726] [SPARK-2567] Eliminate zombie stages in UI. 
+ Kay Ousterhout + 2014-07-25 15:14:13 -0700 + Commit: 37ad3b7, github.com/apache/spark/pull/1566 + + [SPARK-2125] Add sort flag and move sort into shuffle implementations + jerryshao + 2014-07-25 14:34:38 -0700 + Commit: 47b6b38, github.com/apache/spark/pull/1210 + + [SQL]Update HiveMetastoreCatalog.scala + baishuo(白硕) + 2014-07-25 13:59:45 -0700 + Commit: ab3c6a4, github.com/apache/spark/pull/1569 + + [SPARK-2682] Javadoc generated from Scala source code is not in javadoc's index + Yin Huai + 2014-07-25 13:00:13 -0700 + Commit: a19d8c8, github.com/apache/spark/pull/1584 + + [SPARK-2410][SQL] Merging Hive Thrift/JDBC server + Cheng Lian + 2014-07-25 12:20:49 -0700 + Commit: 06dc0d2, github.com/apache/spark/pull/1399 + + [SPARK-2683] unidoc failed because org.apache.spark.util.CallSite uses Java keywords as value names + Yin Huai + 2014-07-25 11:14:51 -0700 + Commit: 32bcf9a, github.com/apache/spark/pull/1585 + + replace println to log4j + fireflyc + 2014-07-25 10:47:52 -0700 + Commit: a2715cc, github.com/apache/spark/pull/1372 + + [SPARK-2665] [SQL] Add EqualNS & Unit Tests + Cheng Hao + 2014-07-25 01:30:22 -0700 + Commit: 184aa1c, github.com/apache/spark/pull/1570 + + [SPARK-2529] Clean closures in foreach and foreachPartition. 
+ Reynold Xin + 2014-07-25 01:10:05 -0700 + Commit: eb82abd, github.com/apache/spark/pull/1583 + + SPARK-2657 Use more compact data structures than ArrayBuffer in groupBy & cogroup + Matei Zaharia + 2014-07-25 00:32:32 -0700 + Commit: 8529ced, github.com/apache/spark/pull/1555 + + [SPARK-2656] Python version of stratified sampling + Doris Xin + 2014-07-24 23:42:08 -0700 + Commit: 2f75a4a, github.com/apache/spark/pull/1554 + + [SPARK-2538] [PySpark] Hash based disk spilling aggregation + Davies Liu + 2014-07-24 22:53:47 -0700 + Commit: 14174ab, github.com/apache/spark/pull/1460 + + [SPARK-2014] Make PySpark store RDDs in MEMORY_ONLY_SER with compression by default + Prashant Sharma + 2014-07-24 18:15:37 -0700 + Commit: eff9714, github.com/apache/spark/pull/1051 + + [SPARK-2464][Streaming] Fixed Twitter stream stopping bug + Tathagata Das + 2014-07-24 15:59:09 -0700 + Commit: a45d548, github.com/apache/spark/pull/1577 + + SPARK-2250: show stage RDDs in UI + Neville Li + 2014-07-24 14:13:00 -0700 + Commit: fec641b, github.com/apache/spark/pull/1188 + + [SPARK-2037]: yarn client mode doesn't support spark.yarn.max.executor.failures + GuoQiang Li + 2014-07-24 14:46:10 -0500 + Commit: 323a83c, github.com/apache/spark/pull/1180 + + [SPARK-2479 (partial)][MLLIB] fix binary metrics unit tests + Xiangrui Meng + 2014-07-24 12:37:02 -0700 + Commit: c960b50, github.com/apache/spark/pull/1576 + + [SPARK-2603][SQL] Remove unnecessary toMap and toList in converting Java collections to Scala collections JsonRDD.scala + Yin Huai + 2014-07-24 11:19:19 -0700 + Commit: b352ef1, github.com/apache/spark/pull/1504 + + [Build] SPARK-2619: Configurable filemode for the spark/bin folder in debian package + tzolov + 2014-07-24 11:12:25 -0700 + Commit: 9fd1414, github.com/apache/spark/pull/1531 + + SPARK-2150: Provide direct link to finished application UI in yarn resou... 
+ Rahul Singhal + 2014-07-24 09:31:04 -0500 + Commit: 46e224a, github.com/apache/spark/pull/1094 + + [SPARK-2661][bagel]unpersist old processed rdd + Daoyuan + 2014-07-24 00:09:36 -0700 + Commit: 42dfab7, github.com/apache/spark/pull/1519 + + SPARK-2310. Support arbitrary Spark properties on the command line with ... + Sandy Ryza + 2014-07-23 23:09:25 -0700 + Commit: e34922a, github.com/apache/spark/pull/1253 + + [SPARK-2658][SQL] Add rule for true = 1. + Michael Armbrust + 2014-07-23 22:52:49 -0700 + Commit: 78d18fd, github.com/apache/spark/pull/1556 + + SPARK-2662: Fix NPE for JsonProtocol + GuoQiang Li + 2014-07-23 22:50:39 -0700 + Commit: 9e7725c, github.com/apache/spark/pull/1511 + + Replace RoutingTableMessage with pair + Ankur Dave + 2014-07-23 20:11:28 -0700 + Commit: 2d25e34, github.com/apache/spark/pull/1553 + + [SPARK-2484][SQL] Build should not run hivecompatibility tests by default. + witgo + 2014-07-23 18:17:05 -0700 + Commit: 60f0ae3, github.com/apache/spark/pull/1403 + + [SPARK-2549] Functions defined inside of other functions trigger failures + Prashant Sharma + 2014-07-23 17:12:28 -0700 + Commit: 9b76332, github.com/apache/spark/pull/1510 + + [SPARK-2102][SQL][CORE] Add option for kryo registration required and use a resource pool in Spark SQL for Kryo instances. + Ian O Connell + 2014-07-23 16:30:06 -0700 + Commit: efdaeb1, github.com/apache/spark/pull/1377 + + [SPARK-2569][SQL] Fix shipping of TEMPORARY hive UDFs. + Michael Armbrust + 2014-07-23 16:26:55 -0700 + Commit: 1871574, github.com/apache/spark/pull/1552 + + SPARK-2226: [SQL] transform HAVING clauses with aggregate expressions that aren't in the aggregation list + William Benton + 2014-07-23 16:25:32 -0700 + Commit: e060d3e, github.com/apache/spark/pull/1497 + + SPARK-2277: clear host->rack info properly + Rui Li + 2014-07-23 16:23:24 -0700 + Commit: 91903e0, github.com/apache/spark/pull/1454 + + [SPARK-2588][SQL] Add some more DSLs. 
+ Takuya UESHIN + 2014-07-23 14:47:23 -0700 + Commit: 1b790cf, github.com/apache/spark/pull/1491 + + [CORE] SPARK-2640: In "local[N]", free cores of the only executor should be touched by "spark.task.cpus" for every finish/start-up of tasks. + woshilaiceshide + 2014-07-23 11:05:41 -0700 + Commit: f776bc9, github.com/apache/spark/pull/1544 + + [SPARK-2609] Log thread ID when spilling ExternalAppendOnlyMap + Andrew Or + 2014-07-23 10:31:45 -0700 + Commit: 2592111, github.com/apache/spark/pull/1517 + + [SPARK-2617] Correct doc and usages of preservesPartitioning + Xiangrui Meng + 2014-07-23 00:58:55 -0700 + Commit: 4c7243e, github.com/apache/spark/pull/1526 + + Remove GraphX MessageToPartition for compatibility with sort-based shuffle + Ankur Dave + 2014-07-22 22:18:30 -0700 + Commit: 6c2be93, github.com/apache/spark/pull/1537 + + [YARN] SPARK-2577: File upload to viewfs is broken due to mount point re... + Gera Shegalov + 2014-07-22 21:05:12 -0500 + Commit: 02e4572, github.com/apache/spark/pull/1483 + + [YARN][SPARK-2606]:In some cases,the spark UI pages display incorrect + GuoQiang Li + 2014-07-22 20:34:40 -0500 + Commit: ddadf1b, github.com/apache/spark/pull/1501 + + Graphx example + CrazyJvm + 2014-07-22 18:14:44 -0700 + Commit: 5f7b991, github.com/apache/spark/pull/1523 + + [SPARK-2615] [SQL] Add Equal Sign "==" Support for HiveQl + Cheng Hao + 2014-07-22 18:13:28 -0700 + Commit: 79fe763, github.com/apache/spark/pull/1522 + + SPARK-2047: Introduce an in-mem Sorter, and use it to reduce mem usage + Aaron Davidson + 2014-07-22 11:58:53 -0700 + Commit: 85d3596, github.com/apache/spark/pull/1502 + + [MLLIB] make Mima ignore updateFeatures (private) in ALS + Xiangrui Meng + 2014-07-22 11:45:37 -0700 + Commit: 1407871, github.com/apache/spark/pull/1533 + + [SPARK-2612] [mllib] Fix data skew in ALS + peng.zhang + 2014-07-22 02:39:07 -0700 + Commit: 75db174, github.com/apache/spark/pull/1521 + + [SPARK-2452] Create a new valid for each instead of using lineId. 
+ Prashant Sharma + 2014-07-22 00:38:26 -0700 + Commit: 81fec99, github.com/apache/spark/pull/1441 + + [SPARK-2470] PEP8 fixes to PySpark + Nicholas Chammas , nchammas + 2014-07-21 22:30:53 -0700 + Commit: 5d16d5b, github.com/apache/spark/pull/1505 + + [SPARK-2086] Improve output of toDebugString to make shuffle boundaries more clear + Gregory Owen + 2014-07-21 18:55:01 -0700 + Commit: c3462c6, github.com/apache/spark/pull/1364 + + [SPARK-2561][SQL] Fix apply schema + Michael Armbrust + 2014-07-21 18:18:17 -0700 + Commit: 511a731, github.com/apache/spark/pull/1470 + + [SPARK-2434][MLlib]: Warning messages that point users to original MLlib implementations added to Examples + Burak + 2014-07-21 17:03:40 -0700 + Commit: a4d6020, github.com/apache/spark/pull/1515 + + Fix flakey HiveQuerySuite test + Aaron Davidson + 2014-07-21 14:35:15 -0700 + Commit: abeacff, github.com/apache/spark/pull/1514 + + [SPARK-2494] [PySpark] make hash of None consistant cross machines + Davies Liu + 2014-07-21 11:59:54 -0700 + Commit: 872538c, github.com/apache/spark/pull/1371 + + SPARK-1707. Remove unnecessary 3 second sleep in YarnClusterScheduler + Sandy Ryza + 2014-07-21 13:15:46 -0500 + Commit: f89cf65, github.com/apache/spark/pull/634 + + [SPARK-2190][SQL] Specialized ColumnType for Timestamp + Cheng Lian + 2014-07-21 00:46:28 -0700 + Commit: cd273a2, github.com/apache/spark/pull/1440 + + [SPARK-1945][MLLIB] Documentation Improvements for Spark 1.0 + Michael Giannakopoulos + 2014-07-20 20:48:44 -0700 + Commit: db56f2d, github.com/apache/spark/pull/1311 + + Improve scheduler delay tooltip. + Kay Ousterhout + 2014-07-20 20:18:18 -0700 + Commit: f6e7302, github.com/apache/spark/pull/1488 + + [SPARK-2552][MLLIB] stabilize logistic function in pyspark + Xiangrui Meng + 2014-07-20 18:40:36 -0700 + Commit: b86db51, github.com/apache/spark/pull/1493 + + SPARK-2564. 
ShuffleReadMetrics.totalBlocksRead is redundant + Sandy Ryza + 2014-07-20 14:45:34 -0700 + Commit: 9564f85, github.com/apache/spark/pull/1474 + + [SPARK-2495][MLLIB] remove private[mllib] from linear models' constructors + Xiangrui Meng + 2014-07-20 13:04:59 -0700 + Commit: 1b10b81, github.com/apache/spark/pull/1492 + + [SPARK-2598] RangePartitioner's binary search does not use the given Ordering + Reynold Xin + 2014-07-20 11:06:06 -0700 + Commit: fa51b0f, github.com/apache/spark/pull/1500 + + SPARK-2519 part 2. Remove pattern matching on Tuple2 in critical section... + Sandy Ryza + 2014-07-20 01:24:32 -0700 + Commit: 98ab411, github.com/apache/spark/pull/1447 + + [SPARK-2524] missing document about spark.deploy.retainedDrivers + lianhuiwang , Wang Lianhui , unknown + 2014-07-19 20:46:59 -0700 + Commit: 4da01e3, github.com/apache/spark/pull/1443 + + SPARK-2587: Fix error message in make-distribution.sh + Mark Wagner + 2014-07-19 20:24:13 -0700 + Commit: c119498, github.com/apache/spark/pull/1489 + + Typo fix to the programming guide in the docs + Cesar Arevalo + 2014-07-19 20:20:07 -0700 + Commit: 0d01e85, github.com/apache/spark/pull/1495 + + SPARK-2596 HOTFIX: Deal with non-existent JIRAs. + Patrick Wendell + 2014-07-19 18:24:21 -0700 + Commit: d39e3b9 + + SPARK-2596 A tool for mirroring github pull requests on JIRA. + Patrick Wendell + 2014-07-19 18:19:08 -0700 + Commit: 49e4727, github.com/apache/spark/pull/1496 + + Revert "[SPARK-2521] Broadcast RDD object (instead of sending it along with every task)." + Reynold Xin + 2014-07-19 16:56:22 -0700 + Commit: 1efb369 + + SPARK-2407: Added Parser of SQL SUBSTR() + chutium + 2014-07-19 11:04:41 -0500 + Commit: 2a73211, github.com/apache/spark/pull/1442 + + put 'curRequestSize = 0' after 'logDebug' it + Lijie Xu + 2014-07-19 01:27:26 -0700 + Commit: 805f329, github.com/apache/spark/pull/1477 + + [SPARK-2521] Broadcast RDD object (instead of sending it along with every task). 
+ Reynold Xin + 2014-07-18 23:52:47 -0700 + Commit: 7b8cd17, github.com/apache/spark/pull/1452 + + [SPARK-2359][MLlib] Correlations + Doris Xin + 2014-07-18 17:25:32 -0700 + Commit: a243364, github.com/apache/spark/pull/1367 + + [SPARK-2571] Correctly report shuffle read metrics. + Kay Ousterhout + 2014-07-18 14:40:32 -0700 + Commit: 7b971b9, github.com/apache/spark/pull/1476 + + [SPARK-2540] [SQL] Add HiveDecimal & HiveVarchar support in unwrapping data + Cheng Hao + 2014-07-18 16:38:11 -0500 + Commit: 7f17208, github.com/apache/spark/pull/1436 + + [SPARK-2535][SQL] Add StringComparison case to NullPropagation. + Takuya UESHIN + 2014-07-18 16:24:00 -0500 + Commit: 3a1709f, github.com/apache/spark/pull/1451 + + [MLlib] SPARK-1536: multiclass classification support for decision tree + Manish Amde , manishamde , Evan Sparks + 2014-07-18 14:00:13 -0700 + Commit: d88f6be, github.com/apache/spark/pull/886 + + Reservoir sampling implementation. + Reynold Xin + 2014-07-18 12:41:50 -0700 + Commit: 586e716, github.com/apache/spark/pull/1478 + + Added t2 instance types + Basit Mustafa + 2014-07-18 12:23:47 -0700 + Commit: 7f87ab9, github.com/apache/spark/pull/1446 + + SPARK-2553. Fix compile error + Sandy Ryza + 2014-07-18 00:47:43 -0700 + Commit: 30b8d36, github.com/apache/spark/pull/1479 + + SPARK-2553. CoGroupedRDD unnecessarily allocates a Tuple2 per dependency... 
+ Sandy Ryza + 2014-07-17 23:57:08 -0700 + Commit: e52b871, github.com/apache/spark/pull/1461 + + [SPARK-2570] [SQL] Fix the bug of ClassCastException + Cheng Hao + 2014-07-17 23:25:01 -0700 + Commit: 29809a6, github.com/apache/spark/pull/1475 + + [SPARK-2411] Add a history-not-found page to standalone Master + Andrew Or + 2014-07-17 19:45:59 -0700 + Commit: 6afca2d, github.com/apache/spark/pull/1336 + + [SPARK-2299] Consolidate various stageIdTo* hash maps in JobProgressListener + Reynold Xin + 2014-07-17 18:58:48 -0700 + Commit: 72e9021, github.com/apache/spark/pull/1262 + + SPARK-1215 [MLLIB]: Clustering: Index out of bounds error (2) + Joseph K. Bradley + 2014-07-17 15:05:02 -0700 + Commit: 935fe65, github.com/apache/spark/pull/1468 + + SPARK-1478.2 Fix incorrect NioServerSocketChannelFactory constructor call + Sean Owen + 2014-07-17 12:20:48 -0700 + Commit: 1fcd5dc, github.com/apache/spark/pull/1466 + + [SPARK-2534] Avoid pulling in the entire RDD in various operators + Reynold Xin + 2014-07-17 10:54:53 -0700 + Commit: d988d34, github.com/apache/spark/pull/1450 + + [SPARK-2423] Clean up SparkSubmit for readability + Andrew Or + 2014-07-17 01:13:32 -0700 + Commit: 9c73822, github.com/apache/spark/pull/1349 + + SPARK-2526: Simplify options in make-distribution.sh + Patrick Wendell + 2014-07-17 01:02:35 -0700 + Commit: d0ea496, github.com/apache/spark/pull/1445 + + [SPARK-2412] CoalescedRDD throws exception with certain pref locs + Aaron Davidson + 2014-07-17 01:01:14 -0700 + Commit: 7c23c0d, github.com/apache/spark/pull/1337 + + [SPARK-2154] Schedule next Driver when one completes (standalone mode) + Aaron Davidson + 2014-07-16 14:16:48 -0700 + Commit: 9c24974, github.com/apache/spark/pull/1405 + + SPARK-1097: Do not introduce deadlock while fixing concurrency bug + Aaron Davidson + 2014-07-16 14:10:17 -0700 + Commit: 8867cd0, github.com/apache/spark/pull/1409 + + [SPARK-2317] Improve task logging. 
+ Reynold Xin + 2014-07-16 11:50:49 -0700 + Commit: 7c8d123, github.com/apache/spark/pull/1259 + + fix compile error of streaming project + James Z.M. Gao + 2014-07-16 11:35:21 -0700 + Commit: caa163f, github.com/apache/spark/pull/153 + + [SPARK-2522] set default broadcast factory to torrent + Xiangrui Meng + 2014-07-16 11:27:51 -0700 + Commit: 96f28c9, github.com/apache/spark/pull/1437 + + [SPARK-2517] Remove some compiler warnings. + Reynold Xin + 2014-07-16 11:15:07 -0700 + Commit: ef48222, github.com/apache/spark/pull/1433 + + [SPARK-2518][SQL] Fix foldability of Substring expression. + Takuya UESHIN + 2014-07-16 11:13:38 -0700 + Commit: cc965ee, github.com/apache/spark/pull/1432 + + SPARK-2519. Eliminate pattern-matching on Tuple2 in performance-critical... + Sandy Ryza + 2014-07-16 11:07:16 -0700 + Commit: fc7edc9, github.com/apache/spark/pull/1435 + + [SQL] Cleaned up ConstantFolding slightly. + Reynold Xin + 2014-07-16 10:55:47 -0700 + Commit: 1c5739f, github.com/apache/spark/pull/1430 + + [SPARK-2525][SQL] Remove as many compilation warning messages as possible in Spark SQL + Yin Huai + 2014-07-16 10:53:59 -0700 + Commit: df95d82, github.com/apache/spark/pull/1444 + + Tightening visibility for various Broadcast related classes. + Reynold Xin + 2014-07-16 10:44:54 -0700 + Commit: efe2a8b, github.com/apache/spark/pull/1438 + + SPARK-2277: make TaskScheduler track hosts on rack + Rui Li + 2014-07-16 22:53:37 +0530 + Commit: 33e64ec, github.com/apache/spark/pull/1212 + + [SPARK-2119][SQL] Improved Parquet performance when reading off S3 + Cheng Lian + 2014-07-16 12:44:51 -0400 + Commit: efc452a, github.com/apache/spark/pull/1370 + + [SPARK-2504][SQL] Fix nullability of Substring expression. + Takuya UESHIN + 2014-07-15 22:43:48 -0700 + Commit: 632fb3d, github.com/apache/spark/pull/1426 + + [SPARK-2509][SQL] Add optimization for Substring. 
+ Takuya UESHIN + 2014-07-15 22:35:34 -0700 + Commit: 9b38b7c, github.com/apache/spark/pull/1428 + + [SPARK-2314][SQL] Override collect and take in JavaSchemaRDD, forwarding to SchemaRDD implementations. + Aaron Staple + 2014-07-15 21:35:36 -0700 + Commit: 90ca532, github.com/apache/spark/pull/1421 + + follow pep8 None should be compared using is or is not + Ken Takagiwa + 2014-07-15 21:34:05 -0700 + Commit: 563acf5, github.com/apache/spark/pull/1422 + + [SPARK-2500] Move the logInfo for registering BlockManager to BlockManagerMasterActor.register method + Henry Saputra + 2014-07-15 21:21:52 -0700 + Commit: 9c12de5, github.com/apache/spark/pull/1424 + + [SPARK-2469] Use Snappy (instead of LZF) for default shuffle compression codec + Reynold Xin + 2014-07-15 18:47:39 -0700 + Commit: 4576d80, github.com/apache/spark/pull/1415 + + [SPARK-2498] [SQL] Synchronize on a lock when using scala reflection inside data type objects. + Zongheng Yang + 2014-07-15 17:58:28 -0700 + Commit: c2048a5, github.com/apache/spark/pull/1423 + + [SQL] Attribute equality comparisons should be done by exprId. + Michael Armbrust + 2014-07-15 17:56:17 -0700 + Commit: 502f907, github.com/apache/spark/pull/1414 + + SPARK-2407: Added internal implementation of SQL SUBSTR() + William Benton + 2014-07-15 14:11:57 -0700 + Commit: 61de65b, github.com/apache/spark/pull/1359 + + [SPARK-2474][SQL] For a registered table in OverrideCatalog, the Analyzer failed to resolve references in the format of "tableName.fieldName" + Yin Huai + 2014-07-15 14:06:45 -0700 + Commit: 8af46d5, github.com/apache/spark/pull/1406 + + [SQL] Whitelist more Hive tests. + Michael Armbrust + 2014-07-15 14:04:01 -0700 + Commit: bcd0c30, github.com/apache/spark/pull/1396 + + [SPARK-2483][SQL] Fix parsing of repeated, nested data access. 
+ Michael Armbrust + 2014-07-15 14:01:48 -0700 + Commit: 0f98ef1, github.com/apache/spark/pull/1411 + + [SPARK-2471] remove runtime scope for jets3t + Xiangrui Meng + 2014-07-15 14:00:54 -0700 + Commit: a21f9a7, github.com/apache/spark/pull/1402 + + Added LZ4 to compression codec in configuration page. + Reynold Xin + 2014-07-15 13:13:33 -0700 + Commit: e7ec815, github.com/apache/spark/pull/1417 + + SPARK-1291: Link the spark UI to RM ui in yarn-client mode + witgo + 2014-07-15 13:52:56 -0500 + Commit: 72ea56d, github.com/apache/spark/pull/1112 + + SPARK-2480: Resolve sbt warnings "NOTE: SPARK_YARN is deprecated, please use -Pyarn flag" + witgo + 2014-07-15 10:46:17 -0700 + Commit: 9dd635e, github.com/apache/spark/pull/1404 + + Reformat multi-line closure argument. + William Benton + 2014-07-15 09:13:39 -0700 + Commit: cb09e93, github.com/apache/spark/pull/1419 + + [MLLIB] [SPARK-2222] Add multiclass evaluation metrics + Alexander Ulanov , unknown , Xiangrui Meng + 2014-07-15 08:40:22 -0700 + Commit: 04b01bb, github.com/apache/spark/pull/1155 + + README update: added "for Big Data". + Reynold Xin + 2014-07-15 02:20:01 -0700 + Commit: 6555618 + + Update README.md to include a slightly more informative project description. + Reynold Xin + 2014-07-15 02:15:29 -0700 + Commit: 8f1d422 + + [SPARK-2477][MLlib] Using appendBias for adding intercept in GeneralizedLinearAlgorithm + DB Tsai + 2014-07-15 02:14:58 -0700 + Commit: 52beb20, github.com/apache/spark/pull/1410 + + [SPARK-2399] Add support for LZ4 compression. + Reynold Xin + 2014-07-15 01:46:57 -0700 + Commit: dd95aba, github.com/apache/spark/pull/1416 + + discarded exceeded completedDrivers + lianhuiwang + 2014-07-15 00:22:06 -0700 + Commit: 7446f5f, github.com/apache/spark/pull/1114 + + [SPARK-2485][SQL] Lock usage of hive client. 
+ Michael Armbrust + 2014-07-15 00:13:51 -0700 + Commit: c7c7ac8, github.com/apache/spark/pull/1412 + + [SPARK-2390] Files in staging directory cannot be deleted and wastes the space of HDFS + Kousuke Saruta + 2014-07-14 23:55:39 -0700 + Commit: c6d7574, github.com/apache/spark/pull/1326 + + Add/increase severity of warning in documentation of groupBy() + Aaron Davidson + 2014-07-14 23:38:12 -0700 + Commit: a2aa7be, github.com/apache/spark/pull/1380 + + SPARK-2486: Utils.getCallSite is now resilient to bogus frames + William Benton + 2014-07-14 23:09:13 -0700 + Commit: 1f99fea, github.com/apache/spark/pull/1413 + + [SPARK-2467] Revert SparkBuild to publish-local to both .m2 and .ivy2. + Takuya UESHIN + 2014-07-14 23:06:35 -0700 + Commit: e2255e4, github.com/apache/spark/pull/1398 + + [SPARK-2446][SQL] Add BinaryType support to Parquet I/O. + Takuya UESHIN + 2014-07-14 15:42:28 -0700 + Commit: 9fe693b, github.com/apache/spark/pull/1373 + + [SPARK-1946] Submit tasks after (configured ratio) executors have been registered + li-zhihui + 2014-07-14 15:32:49 -0500 + Commit: 3dd8af7, github.com/apache/spark/pull/900 + + [SPARK-2443][SQL] Fix slow read from partitioned tables + Zongheng Yang + 2014-07-14 13:22:24 -0700 + Commit: d60b09b, github.com/apache/spark/pull/1408 + + move some test file to match src code + Daoyuan + 2014-07-14 10:40:44 -0700 + Commit: 38ccd6e, github.com/apache/spark/pull/1401 + + Made rdd.py pep8 complaint by using Autopep8 and a little manual editing. + Prashant Sharma + 2014-07-14 00:42:59 -0700 + Commit: aab5349, github.com/apache/spark/pull/1354 + + SPARK-2363. Clean MLlib's sample data files + Sean Owen + 2014-07-13 19:27:43 -0700 + Commit: 635888c, github.com/apache/spark/pull/1394 + + SPARK-2462. Make Vector.apply public. 
+ Sandy Ryza + 2014-07-12 16:55:15 -0700 + Commit: 4c8be64, github.com/apache/spark/pull/1389 + + [SPARK-2405][SQL] Reusue same byte buffers when creating new instance of InMemoryRelation + Michael Armbrust + 2014-07-12 12:13:32 -0700 + Commit: 1a7d7cc, github.com/apache/spark/pull/1332 + + [SPARK-2441][SQL] Add more efficient distinct operator. + Michael Armbrust + 2014-07-12 12:07:27 -0700 + Commit: 7e26b57, github.com/apache/spark/pull/1366 + + [SPARK-2455] Mark (Shippable)VertexPartition serializable + Ankur Dave + 2014-07-12 12:05:34 -0700 + Commit: 7a01352, github.com/apache/spark/pull/1376 + + Use the Executor's ClassLoader in sc.objectFile(). + Daniel Darabos + 2014-07-12 00:07:42 -0700 + Commit: 2245c87, github.com/apache/spark/pull/181 + + use specialized axpy in RowMatrix for SVD + Li Pu , Xiangrui Meng , Li Pu + 2014-07-11 23:26:47 -0700 + Commit: d38887b, github.com/apache/spark/pull/1378 + + [SPARK-1969][MLlib] Online summarizer APIs for mean, variance, min, and max + DB Tsai + 2014-07-11 23:04:43 -0700 + Commit: 5596086, github.com/apache/spark/pull/955 + + [SPARK-2457] Inconsistent description in README about build option + Kousuke Saruta + 2014-07-11 21:10:26 -0700 + Commit: cbff187, github.com/apache/spark/pull/1382 + + [SPARK-2437] Rename MAVEN_PROFILES to SBT_MAVEN_PROFILES and add SBT_MAVEN_PROPERTIES + Prashant Sharma + 2014-07-11 11:52:35 -0700 + Commit: b23e9c3, github.com/apache/spark/pull/1374 + + [Minor] Remove unused val in Master + Andrew Or + 2014-07-11 00:21:16 -0700 + Commit: f4f46de, github.com/apache/spark/pull/1365 + + fix Graph partitionStrategy comment + CrazyJvm + 2014-07-11 00:02:24 -0700 + Commit: 282cca0, github.com/apache/spark/pull/1368 + + [SPARK-2358][MLLIB] Add an option to include native BLAS/LAPACK loader in the build + Xiangrui Meng + 2014-07-10 21:57:54 -0700 + Commit: 2f59ce7, github.com/apache/spark/pull/1295 + + [SPARK-2428][SQL] Add except and intersect methods to SchemaRDD. 
+ Takuya UESHIN + 2014-07-10 19:27:24 -0700 + Commit: 10b59ba, github.com/apache/spark/pull/1355 + + [SPARK-2415] [SQL] RowWriteSupport should handle empty ArrayType correctly. + Takuya UESHIN + 2014-07-10 19:23:44 -0700 + Commit: f5abd27, github.com/apache/spark/pull/1339 + + [SPARK-2431][SQL] Refine StringComparison and related codes. + Takuya UESHIN + 2014-07-10 19:20:00 -0700 + Commit: f62c427, github.com/apache/spark/pull/1357 + + SPARK-2427: Fix Scala examples that use the wrong command line arguments index + Artjom-Metro , Artjom-Metro + 2014-07-10 16:03:30 -0700 + Commit: ae8ca4d, github.com/apache/spark/pull/1353 + + [SPARK-1341] [Streaming] Throttle BlockGenerator to limit rate of data consumption. + Issac Buenrostro + 2014-07-10 16:01:08 -0700 + Commit: 2dd6724, github.com/apache/spark/pull/945 + + [SPARK-1478].3: Upgrade FlumeInputDStream's FlumeReceiver to support FLUME-1915 + tmalaska , Tathagata Das + 2014-07-10 13:15:02 -0700 + Commit: 40a8fef, github.com/apache/spark/pull/1347 + + name ec2 instances and security groups consistently + Nicholas Chammas , nchammas + 2014-07-10 12:56:00 -0700 + Commit: 369aa84, github.com/apache/spark/pull/1344 + + HOTFIX: Minor doc update for sbt change + Patrick Wendell + 2014-07-10 11:10:43 -0700 + Commit: 88006a6 + + [SPARK-1776] Have Spark's SBT build read dependencies from Maven. + Prashant Sharma , Patrick Wendell + 2014-07-10 11:03:37 -0700 + Commit: 628932b, github.com/apache/spark/pull/772 + + SPARK-2115: Stage kill link is too close to stage details link + Masayoshi TSUZUKI + 2014-07-10 01:18:37 -0700 + Commit: c2babc0, github.com/apache/spark/pull/1350 + + Clean up SparkKMeans example's code + Raymond Liu + 2014-07-09 23:39:29 -0700 + Commit: 2b18ea9, github.com/apache/spark/pull/1352 + + HOTFIX: Remove persistently failing test in master. + Patrick Wendell + 2014-07-09 19:44:24 -0700 + Commit: 553c578 + + Revert "[HOTFIX] Synchronize on SQLContext.settings in tests." 
+ Patrick Wendell + 2014-07-09 19:36:38 -0700 + Commit: dd22bc2 + + SPARK-2416: Allow richer reporting of unit test results + Patrick Wendell + 2014-07-09 19:26:16 -0700 + Commit: 2e0a037, github.com/apache/spark/pull/1340 + + SPARK-1782: svd for sparse matrix using ARPACK + Li Pu , Xiangrui Meng , Li Pu + 2014-07-09 12:15:08 -0700 + Commit: 1f33e1f, github.com/apache/spark/pull/964 + + [SPARK-2417][MLlib] Fix DecisionTree tests + johnnywalleye + 2014-07-09 11:06:34 -0700 + Commit: d35e3db, github.com/apache/spark/pull/1343 + + [STREAMING] SPARK-2343: Fix QueueInputDStream with oneAtATime false + Manuel Laflamme + 2014-07-09 10:45:45 -0700 + Commit: 0eb1152, github.com/apache/spark/pull/1285 + + [SPARK-2384] Add tooltips to UI. + Kay Ousterhout + 2014-07-08 22:57:21 -0700 + Commit: 339441f, github.com/apache/spark/pull/1314 + + [SPARK-2152][MLlib] fix bin offset in DecisionTree node aggregations (also resolves SPARK-2160) + johnnywalleye + 2014-07-08 19:17:26 -0700 + Commit: 1114207, github.com/apache/spark/pull/1316 + + [SPARK-2413] Upgrade junit_xml_listener to 0.5.1 + DB Tsai + 2014-07-08 17:50:36 -0700 + Commit: ac9cdc1, github.com/apache/spark/pull/1333 + + [SPARK-2392] Executors should not start their own HTTP servers + Andrew Or + 2014-07-08 17:35:31 -0700 + Commit: bf04a39, github.com/apache/spark/pull/1335 + + [SPARK-2362] Fix for newFilesOnly logic in file DStream + Gabriele Nizzoli + 2014-07-08 14:23:38 -0700 + Commit: e6f7bfc, github.com/apache/spark/pull/1077 + + [SPARK-2409] Make SQLConf thread safe. 
+ Reynold Xin + 2014-07-08 14:00:47 -0700 + Commit: 32516f8, github.com/apache/spark/pull/1334 + + SPARK-2400 : fix spark.yarn.max.executor.failures explaination + CrazyJvm + 2014-07-08 13:55:42 -0500 + Commit: b520b64, github.com/apache/spark/pull/1282 + + [SPARK-2403] Catch all errors during serialization in DAGScheduler + Daniel Darabos + 2014-07-08 10:43:46 -0700 + Commit: c8a2313, github.com/apache/spark/pull/1329 + + [SPARK-2395][SQL] Optimize common LIKE patterns. + Michael Armbrust + 2014-07-08 10:36:18 -0700 + Commit: cc3e0a1, github.com/apache/spark/pull/1325 + + [EC2] Add default history server port to ec2 script + Andrew Or + 2014-07-08 16:49:31 +0900 + Commit: 56e009d, github.com/apache/spark/pull/1296 + + [SPARK-2391][SQL] Custom take() for LIMIT queries. + Michael Armbrust + 2014-07-08 00:41:46 -0700 + Commit: 5a40636, github.com/apache/spark/pull/1318 + + Resolve sbt warnings during build Ⅱ + witgo + 2014-07-08 00:31:42 -0700 + Commit: 3cd5029, github.com/apache/spark/pull/1153 + + Updated programming-guide.md + Rishi Verma + 2014-07-08 00:29:23 -0700 + Commit: 0128905, github.com/apache/spark/pull/1324 + + [SPARK-2235][SQL]Spark SQL basicOperator add Intersect operator + Yanjie Gao , YanjieGao <396154235@qq.com> + 2014-07-07 19:40:04 -0700 + Commit: 50561f4, github.com/apache/spark/pull/1150 + + [SPARK-2376][SQL] Selecting list values inside nested JSON objects raises java.lang.IllegalArgumentException + Yin Huai + 2014-07-07 18:37:38 -0700 + Commit: 4352a2f, github.com/apache/spark/pull/1320 + + [SPARK-2375][SQL] JSON schema inference may not resolve type conflicts correctly for a field inside an array of structs + Yin Huai + 2014-07-07 17:05:59 -0700 + Commit: f0496ee, github.com/apache/spark/pull/1308 + + [SPARK-2386] [SQL] RowWriteSupport should use the exact types to cast. 
+ Takuya UESHIN + 2014-07-07 17:04:02 -0700 + Commit: 4deeed1, github.com/apache/spark/pull/1315 + + [SPARK-2339][SQL] SQL parser in sql-core is case sensitive, but a table alias is converted to lower case when we create Subquery + Yin Huai + 2014-07-07 17:01:44 -0700 + Commit: c0b4cf0, github.com/apache/spark/pull/1317 + + [SPARK-1977][MLLIB] register mutable BitSet in MovieLenseALS + Neville Li + 2014-07-07 15:06:14 -0700 + Commit: f7ce1b3, github.com/apache/spark/pull/1319 + + [SPARK-2327] [SQL] Fix nullabilities of Join/Generate/Aggregate. + Takuya UESHIN + 2014-07-05 11:51:48 -0700 + Commit: 9d5ecf8, github.com/apache/spark/pull/1266 + + [SPARK-2366] [SQL] Add column pruning for the right side of LeftSemi join. + Takuya UESHIN + 2014-07-05 11:48:08 -0700 + Commit: 3da8df9, github.com/apache/spark/pull/1301 + + [SPARK-2306]:BoundedPriorityQueue is private and not registered with Kry... + ankit.bhardwaj + 2014-07-04 22:06:10 -0700 + Commit: 42f3abd, github.com/apache/spark/pull/1299 + + [SPARK-2370][SQL] Decrease metadata retrieved for partitioned hive queries. + Michael Armbrust + 2014-07-04 19:15:48 -0700 + Commit: 9d006c9, github.com/apache/spark/pull/1305 + + Added SignalLogger to HistoryServer. + Reynold Xin + 2014-07-04 17:33:07 -0700 + Commit: 0db5d5a, github.com/apache/spark/pull/1300 + + HOTFIX: Clean before building docs during release. 
+ Patrick Wendell + 2014-07-04 10:01:19 -0700 + Commit: fc71658 + + [SPARK-2234][SQL]Spark SQL basicOperators add Except operator + Yanjie Gao , YanjieGao <396154235@qq.com>, root , gaoyanjie + 2014-07-04 02:43:57 -0700 + Commit: 5dadda8, github.com/apache/spark/pull/1151 + + [SPARK-2059][SQL] Add analysis checks + Reynold Xin , Michael Armbrust + 2014-07-04 00:53:41 -0700 + Commit: b3e768e, github.com/apache/spark/pull/1265 + + Update SQLConf.scala + baishuo(白硕) + 2014-07-04 00:25:31 -0700 + Commit: 0bbe612, github.com/apache/spark/pull/1272 + + [SPARK-1199][REPL] Remove VALId and use the original import style for defined classes. + Prashant Sharma + 2014-07-04 00:05:27 -0700 + Commit: d434150, github.com/apache/spark/pull/1179 + + [SPARK-2059][SQL] Don't throw TreeNodeException in `execution.ExplainCommand` + Cheng Lian + 2014-07-03 23:41:54 -0700 + Commit: 5448804, github.com/apache/spark/pull/1294 + + SPARK-2282: Reuse PySpark Accumulator sockets to avoid crashing Spark + Aaron Davidson + 2014-07-03 23:02:36 -0700 + Commit: 97a0bfe, github.com/apache/spark/pull/1220 + + [SPARK-2307][Reprise] Correctly report RDD blocks on SparkUI + Andrew Or + 2014-07-03 22:48:23 -0700 + Commit: 3894a49, github.com/apache/spark/pull/1255 + + [SPARK-2350] Don't NPE while launching drivers + Aaron Davidson + 2014-07-03 22:31:41 -0700 + Commit: 586feb5, github.com/apache/spark/pull/1289 + + [SPARK-1097] Workaround Hadoop conf ConcurrentModification issue + Raymond Liu + 2014-07-03 19:24:22 -0700 + Commit: 5fa0a05, github.com/apache/spark/pull/1273 + + Streaming programming guide typos + Clément MATHIEU + 2014-07-03 18:31:18 -0700 + Commit: fdc4c11, github.com/apache/spark/pull/1286 + + [HOTFIX] Synchronize on SQLContext.settings in tests. + Zongheng Yang + 2014-07-03 17:37:53 -0700 + Commit: d4c30cd, github.com/apache/spark/pull/1277 + + [SPARK-2109] Setting SPARK_MEM for bin/pyspark does not work. 
+ Prashant Sharma + 2014-07-03 15:06:58 -0700 + Commit: 731f683b, github.com/apache/spark/pull/1050 + + [SPARK-2342] Evaluation helper's output type doesn't conform to input ty... + Yijie Shen + 2014-07-03 13:22:13 -0700 + Commit: a9b52e5, github.com/apache/spark/pull/1283 + + SPARK-1675. Make clear whether computePrincipalComponents requires centered data + Sean Owen + 2014-07-03 11:54:51 -0700 + Commit: 2b36344, github.com/apache/spark/pull/1171 + + [SPARK] Fix NPE for ExternalAppendOnlyMap + Andrew Or + 2014-07-03 10:26:50 -0700 + Commit: c480537, github.com/apache/spark/pull/1288 + + [SPARK-2324] SparkContext should not exit directly when spark.local.dir is a list of multiple paths and one of them has error + yantangzhai + 2014-07-03 10:14:35 -0700 + Commit: 3bbeca6, github.com/apache/spark/pull/1274 + + [SPARK-2287] [SQL] Make ScalaReflection be able to handle Generic case classes. + Takuya UESHIN + 2014-07-02 10:10:36 -0700 + Commit: bc7041a, github.com/apache/spark/pull/1226 + + [SPARK-2328] [SQL] Add execution of `SHOW TABLES` before `TestHive.reset()`. + Takuya UESHIN + 2014-07-02 10:07:01 -0700 + Commit: 1e2c26c, github.com/apache/spark/pull/1268 + + SPARK-2186: Spark SQL DSL support for simple aggregations such as SUM and AVG + Ximo Guanter Gonzalbez + 2014-07-02 10:03:44 -0700 + Commit: 5c6ec94, github.com/apache/spark/pull/1211 + + update the comments in SqlParser + CodingCat + 2014-07-01 20:37:10 -0700 + Commit: 6596392, github.com/apache/spark/pull/1275 + + [SPARK-2185] Emit warning when task size exceeds a threshold. + Kay Ousterhout + 2014-07-01 01:56:51 -0700 + Commit: 05c3d90, github.com/apache/spark/pull/1149 + + SPARK-2332 [build] add exclusion for old servlet-api on hadoop-client in core + Peter MacKinnon + 2014-07-01 00:28:38 -0700 + Commit: 3319a3e, github.com/apache/spark/pull/1271 + + SPARK-2293. Replace RDD.zip usage by map with predict inside. 
+ Sean Owen + 2014-06-30 16:03:38 -0700 + Commit: 04fa122, github.com/apache/spark/pull/1250 + + [SPARK-2318] When exiting on a signal, print the signal name first. + Reynold Xin + 2014-06-30 15:12:38 -0700 + Commit: 5fccb56, github.com/apache/spark/pull/1260 + + [SPARK-2322] Exception in resultHandler should NOT crash DAGScheduler and shutdown SparkContext. + Reynold Xin + 2014-06-30 11:50:22 -0700 + Commit: 358ae15, github.com/apache/spark/pull/1264 + + SPARK-2077 Log serializer that actually ends up being used + Andrew Ash + 2014-06-29 23:29:05 -0700 + Commit: 6803642, github.com/apache/spark/pull/1017 + + SPARK-897: preemptively serialize closures + William Benton + 2014-06-29 23:27:34 -0700 + Commit: a484030, github.com/apache/spark/pull/143 + + [SPARK-2104] Fix task serializing issues when sort with Java non serializable class + jerryshao + 2014-06-29 23:00:00 -0700 + Commit: 66135a3, github.com/apache/spark/pull/1245 + + [SPARK-1683] Track task read metrics. + Kay Ousterhout + 2014-06-29 22:01:42 -0700 + Commit: 7b71a0e, github.com/apache/spark/pull/962 + + [SPARK-2320] Reduce exception/code block font size in web ui + Reynold Xin + 2014-06-29 16:46:28 -0700 + Commit: cdf613f, github.com/apache/spark/pull/1261 + + Improve MapOutputTracker error logging. 
+ Reynold Xin + 2014-06-28 21:05:03 -0700 + Commit: 2053d79, github.com/apache/spark/pull/1258 + + [SPARK-1394] Remove SIGCHLD handler in worker subprocess + Matthew Farrellee + 2014-06-28 18:39:27 -0700 + Commit: 3c104c7, github.com/apache/spark/pull/1247 + + [SPARK-2233] make-distribution script should list the git hash in the RELEASE file + Guillaume Ballet + 2014-06-28 13:07:12 -0700 + Commit: b8f2e13, github.com/apache/spark/pull/1216 + + [SPARK-2003] Fix python SparkContext example + Matthew Farrellee + 2014-06-27 18:20:33 -0700 + Commit: 0e0686d, github.com/apache/spark/pull/1246 + + [SPARK-2259] Fix highly misleading docs on cluster / client deploy modes + Andrew Or + 2014-06-27 16:11:31 -0700 + Commit: f17510e, github.com/apache/spark/pull/1200 + + [SPARK-2307] SparkUI - storage tab displays incorrect RDDs + Andrew Or + 2014-06-27 15:23:25 -0700 + Commit: 21e0f77, github.com/apache/spark/pull/1249 + + SPARK-2181:The keys for sorting the columns of Executor page in SparkUI are incorrect + witgo + 2014-06-26 21:59:21 -0700 + Commit: 18f29b9, github.com/apache/spark/pull/1135 + + [SPARK-2251] fix concurrency issues in random sampler + Xiangrui Meng + 2014-06-26 21:46:55 -0700 + Commit: c23f5db, github.com/apache/spark/pull/1229 + + [SPARK-2297][UI] Make task attempt and speculation more explicit in UI. + Reynold Xin + 2014-06-26 21:13:26 -0700 + Commit: d1636dd, github.com/apache/spark/pull/1236 + + Removed throwable field from FetchFailedException and added MetadataFetchFailedException + Reynold Xin + 2014-06-26 21:12:16 -0700 + Commit: bf578de, github.com/apache/spark/pull/1227 + + [SQL]Extract the joinkeys from join condition + Cheng Hao + 2014-06-26 19:18:11 -0700 + Commit: 981bde9, github.com/apache/spark/pull/1190 + + Strip '@' symbols when merging pull requests. 
+ Patrick Wendell + 2014-06-26 17:09:24 -0700 + Commit: f1f7385, github.com/apache/spark/pull/1239 + + Fixing AWS instance type information based upon current EC2 data + Zichuan Ye + 2014-06-26 15:21:29 -0700 + Commit: 62d4a0f, github.com/apache/spark/pull/1156 + + [SPARK-2286][UI] Report exception/errors for failed tasks that are not ExceptionFailure + Reynold Xin + 2014-06-26 14:00:45 -0700 + Commit: 6587ef7, github.com/apache/spark/pull/1225 + + [SPARK-2295] [SQL] Make JavaBeans nullability stricter. + Takuya UESHIN + 2014-06-26 13:37:19 -0700 + Commit: 32a1ad7, github.com/apache/spark/pull/1235 + + Remove use of spark.worker.instances + Kay Ousterhout + 2014-06-26 08:20:27 -0500 + Commit: 48a82a8, github.com/apache/spark/pull/1214 + + [SPARK-2254] [SQL] ScalaRefection should mark primitive types as non-nullable. + Takuya UESHIN + 2014-06-25 23:55:31 -0700 + Commit: e4899a2, github.com/apache/spark/pull/1193 + + [SPARK-2172] PySpark cannot import mllib modules in YARN-client mode + Szul, Piotr + 2014-06-25 21:55:49 -0700 + Commit: 441cdcc, github.com/apache/spark/pull/1223 + + [SPARK-2284][UI] Mark all failed tasks as failures. + Reynold Xin + 2014-06-25 22:35:03 -0700 + Commit: 4a346e2, github.com/apache/spark/pull/1224 + + [SPARK-1749] Job cancellation when SchedulerBackend does not implement killTask + Mark Hamstra , Kay Ousterhout + 2014-06-25 20:57:48 -0700 + Commit: b88a59a, github.com/apache/spark/pull/1219 + + [SPARK-2283][SQL] Reset test environment before running PruningSuite + Cheng Lian + 2014-06-25 18:41:47 -0700 + Commit: 7f196b0, github.com/apache/spark/pull/1221 + + [SQL] SPARK-1800 Add broadcast hash join operator & associated hints. 
+ Zongheng Yang , Michael Armbrust + 2014-06-25 18:06:33 -0700 + Commit: 9d824fe, github.com/apache/spark/pull/1163 + + [SPARK-2204] Launch tasks on the proper executors in mesos fine-grained mode + Sebastien Rainville + 2014-06-25 13:21:18 -0700 + Commit: 1132e47, github.com/apache/spark/pull/1140 + + [SPARK-2270] Kryo cannot serialize results returned by asJavaIterable + Reynold Xin + 2014-06-25 12:43:22 -0700 + Commit: 7ff2c75, github.com/apache/spark/pull/1206 + + [SPARK-2258 / 2266] Fix a few worker UI bugs + Andrew Or + 2014-06-25 12:23:08 -0700 + Commit: 9aa6032, github.com/apache/spark/pull/1213 + + [SPARK-2242] HOTFIX: pyspark shell hangs on simple job + Andrew Or + 2014-06-25 10:47:22 -0700 + Commit: 5603e4c, github.com/apache/spark/pull/1178 + + Replace doc reference to Shark with Spark SQL. + Reynold Xin + 2014-06-25 01:01:23 -0700 + Commit: ac06a85 + + SPARK-2038: rename "conf" parameters in the saveAsHadoop functions with source-compatibility + CodingCat + 2014-06-25 00:23:32 -0700 + Commit: acc01ab, github.com/apache/spark/pull/1137 + + [BUGFIX][SQL] Should match java.math.BigDecimal when wnrapping Hive output + Cheng Lian + 2014-06-25 00:17:28 -0700 + Commit: 22036ae, github.com/apache/spark/pull/1199 + + [SPARK-2263][SQL] Support inserting MAP to Hive tables + Cheng Lian + 2014-06-25 00:14:34 -0700 + Commit: 8fade89, github.com/apache/spark/pull/1205 + + SPARK-2248: spark.default.parallelism does not apply in local mode + witgo + 2014-06-24 19:44:37 -0700 + Commit: b6b4485, github.com/apache/spark/pull/1194 + + Fix possible null pointer in acumulator toString + Michael Armbrust + 2014-06-24 19:39:19 -0700 + Commit: 2714968, github.com/apache/spark/pull/1204 + + Autodetect JAVA_HOME on RPM-based systems + Matthew Farrellee + 2014-06-24 19:31:20 -0700 + Commit: 54055fb, github.com/apache/spark/pull/1185 + + [SQL]Add base row updating methods for JoinedRow + Cheng Hao + 2014-06-24 19:07:02 -0700 + Commit: 133495d, github.com/apache/spark/pull/1187 + + 
[SPARK-1112, 2156] Bootstrap to fetch the driver's Spark properties. + Xiangrui Meng + 2014-06-24 19:06:07 -0700 + Commit: 8ca4176, github.com/apache/spark/pull/1132 + + [SPARK-2264][SQL] Fix failing CachedTableSuite + Michael Armbrust + 2014-06-24 19:04:29 -0700 + Commit: a162c9b, github.com/apache/spark/pull/1201 + + Fix broken Json tests. + Kay Ousterhout + 2014-06-24 16:54:50 -0700 + Commit: 1978a90, github.com/apache/spark/pull/1198 + + HOTFIX: Disabling tests per SPARK-2264 + Patrick Wendell + 2014-06-24 15:09:30 -0700 + Commit: 221909e + + SPARK-1937: fix issue with task locality + Rui Li , lirui-intel + 2014-06-24 11:40:37 -0700 + Commit: 924b708, github.com/apache/spark/pull/892 + + [SPARK-2252] Fix MathJax for HTTPs. + Reynold Xin + 2014-06-23 23:18:47 -0700 + Commit: 420c1c3, github.com/apache/spark/pull/1189 + + [SPARK-2124] Move aggregation into shuffle implementations + jerryshao + 2014-06-23 20:25:46 -0700 + Commit: 56eb8af, github.com/apache/spark/pull/1064 + + [SPARK-2227] Support dfs command in SQL. + Reynold Xin + 2014-06-23 18:34:54 -0700 + Commit: 51c8168, github.com/apache/spark/pull/1167 + + Cleanup on Connection, ConnectionManagerId, ConnectionManager classes part 2 + Henry Saputra + 2014-06-23 17:13:26 -0700 + Commit: 383bf72, github.com/apache/spark/pull/1157 + + [SPARK-1768] History server enhancements. + Marcelo Vanzin + 2014-06-23 13:53:44 -0700 + Commit: 21ddd7d, github.com/apache/spark/pull/718 + + [SPARK-2118] spark class should complain if tools jar is missing. 
+ Prashant Sharma + 2014-06-23 13:35:09 -0700 + Commit: 6dc6722, github.com/apache/spark/pull/1068 + + [SPARK-1669][SQL] Made cacheTable idempotent + Cheng Lian + 2014-06-23 13:24:33 -0700 + Commit: a4bc442, github.com/apache/spark/pull/1183 + + Fix mvn detection + Matthew Farrellee + 2014-06-23 11:24:05 -0700 + Commit: 853a2b9, github.com/apache/spark/pull/1181 + + Fixed small running on YARN docs typo + Vlad + 2014-06-23 10:55:49 -0500 + Commit: b88238f, github.com/apache/spark/pull/1158 + + [SPARK-1395] Fix "local:" URI support in Yarn mode (again). + Marcelo Vanzin + 2014-06-23 08:51:11 -0500 + Commit: e380767, github.com/apache/spark/pull/560 + + SPARK-2166 - Listing of instances to be terminated before the prompt + Jean-Martin Archer + 2014-06-22 20:52:02 -0700 + Commit: 9cb64b2, github.com/apache/spark/pull/270 + + SPARK-2241: quote command line args in ec2 script + Ori Kremer + 2014-06-22 20:21:23 -0700 + Commit: 9fc373e, github.com/apache/spark/pull/1169 + + SPARK-2229: FileAppender throw an llegalArgumentException in jdk6 + witgo + 2014-06-22 18:25:16 -0700 + Commit: 409d24e, github.com/apache/spark/pull/1174 + + SPARK-1316. Remove use of Commons IO + Sean Owen + 2014-06-22 11:47:49 -0700 + Commit: 9fe28c3, github.com/apache/spark/pull/1173 + + SPARK-2034. KafkaInputDStream doesn't close resources and may prevent JVM shutdown + Sean Owen + 2014-06-22 01:12:15 -0700 + Commit: 476581e, github.com/apache/spark/pull/980 + + SPARK-2231: dev/run-tests should include YARN and use a recent Hadoop version + Patrick Wendell + 2014-06-22 00:55:27 -0700 + Commit: 58b32f3, github.com/apache/spark/pull/1175 + + SPARK-1996. 
Remove use of special Maven repo for Akka + Sean Owen + 2014-06-21 23:29:57 -0700 + Commit: 1db9cbc, github.com/apache/spark/pull/1170 + + HOTFIX: Add excludes for new MIMA files + Patrick Wendell + 2014-06-21 15:20:15 -0700 + Commit: 3e0b078 + + HOTFIX: Fix missing MIMA ignore + Patrick Wendell + 2014-06-21 13:02:49 -0700 + Commit: 0a432d6 + + [SQL] Break hiveOperators.scala into multiple files. + Reynold Xin + 2014-06-21 12:04:18 -0700 + Commit: ec935ab, github.com/apache/spark/pull/1166 + + [SQL] Pass SQLContext instead of SparkContext into physical operators. + Reynold Xin + 2014-06-20 22:49:48 -0700 + Commit: ca5d8b5, github.com/apache/spark/pull/1164 + + Fix some tests. + Marcelo Vanzin + 2014-06-20 20:05:12 -0700 + Commit: 648553d, github.com/apache/spark/pull/917 + + [SPARK-2061] Made splits deprecated in JavaRDDLike + Anant + 2014-06-20 18:54:00 -0700 + Commit: 010c460, github.com/apache/spark/pull/1062 + + HOTFIX: Fixing style error introduced by 08d0ac + Patrick Wendell + 2014-06-20 18:44:54 -0700 + Commit: a678642 + + [SPARK-1970] Update unit test in XORShiftRandomSuite to use ChiSquareTest from commons-math3 + Doris Xin + 2014-06-20 18:42:02 -0700 + Commit: e99903b, github.com/apache/spark/pull/1073 + + SPARK-1902 Silence stacktrace from logs when doing port failover to port n+1 + Andrew Ash + 2014-06-20 18:25:33 -0700 + Commit: 08d0aca, github.com/apache/spark/pull/1019 + + [SQL] Use hive.SessionState, not the thread local SessionState + Aaron Davidson + 2014-06-20 17:55:54 -0700 + Commit: 2044784, github.com/apache/spark/pull/1148 + + Move ScriptTransformation into the appropriate place. + Reynold Xin + 2014-06-20 17:16:56 -0700 + Commit: d4c7572, github.com/apache/spark/pull/1162 + + Clean up CacheManager et al. + Andrew Or + 2014-06-20 17:14:33 -0700 + Commit: 01125a1, github.com/apache/spark/pull/1083 + + [SPARK-2225] Turn HAVING without GROUP BY into WHERE. 
+ Reynold Xin + 2014-06-20 15:38:02 -0700 + Commit: 0ac71d1, github.com/apache/spark/pull/1161 + + SPARK-2180: support HAVING clauses in Hive queries + William Benton + 2014-06-20 13:41:38 -0700 + Commit: 171ebb3, github.com/apache/spark/pull/1136 + + SPARK-1868: Users should be allowed to cogroup at least 4 RDDs + Allan Douglas R. de Oliveira + 2014-06-20 11:03:03 -0700 + Commit: 6a224c3, github.com/apache/spark/pull/813 + + [SPARK-2163] class LBFGS optimize with Double tolerance instead of Int + Gang Bai + 2014-06-20 08:52:20 -0700 + Commit: d484dde, github.com/apache/spark/pull/1104 + + [SPARK-2218] rename Equals to EqualTo in Spark SQL expressions. + Reynold Xin + 2014-06-20 00:34:59 -0700 + Commit: 2f6a835, github.com/apache/spark/pull/1146 + + [SPARK-2196] [SQL] Fix nullability of CaseWhen. + Takuya UESHIN + 2014-06-20 00:12:52 -0700 + Commit: 3249528, github.com/apache/spark/pull/1133 + + SPARK-2203: PySpark defaults to use same num reduce partitions as map side + Aaron Davidson + 2014-06-20 00:06:57 -0700 + Commit: f46e02f, github.com/apache/spark/pull/1138 + + [SPARK-2209][SQL] Cast shouldn't do null check twice. + Reynold Xin + 2014-06-20 00:01:19 -0700 + Commit: c55bbb4, github.com/apache/spark/pull/1143 + + [SPARK-2210] cast to boolean on boolean value gets turned into NOT((boolean_condition) = 0) + Reynold Xin + 2014-06-19 23:58:23 -0700 + Commit: 6175640, github.com/apache/spark/pull/1144 + + SPARK-1293 [SQL] Parquet support for nested types + Andre Schumacher , Michael Armbrust + 2014-06-19 23:47:45 -0700 + Commit: f479cf3, github.com/apache/spark/pull/360 + + [SPARK-2177][SQL] describe table result contains only one column + Yin Huai + 2014-06-19 23:41:38 -0700 + Commit: f397e92, github.com/apache/spark/pull/1118 + + [SQL] Improve Speed of InsertIntoHiveTable + Michael Armbrust + 2014-06-19 23:39:03 -0700 + Commit: d3b7671, github.com/apache/spark/pull/1130 + + More minor scaladoc cleanup for Spark SQL. 
+ Reynold Xin + 2014-06-19 22:34:21 -0700 + Commit: 278ec8a, github.com/apache/spark/pull/1142 + + HOTFIX: SPARK-2208 local metrics tests can fail on fast machines + Patrick Wendell + 2014-06-19 21:06:28 -0700 + Commit: e551479, github.com/apache/spark/pull/1141 + + A few minor Spark SQL Scaladoc fixes. + Reynold Xin + 2014-06-19 18:24:05 -0700 + Commit: 5464e79, github.com/apache/spark/pull/1139 + + [SPARK-2151] Recognize memory format for spark-submit + nravi + 2014-06-19 17:11:06 -0700 + Commit: f14b00a, github.com/apache/spark/pull/1095 + + [SPARK-2191][SQL] Make sure InsertIntoHiveTable doesn't execute more than once. + Michael Armbrust + 2014-06-19 14:14:03 -0700 + Commit: 777c595, github.com/apache/spark/pull/1129 + + [SPARK-2051]In yarn.ClientBase spark.yarn.dist.* do not work + witgo + 2014-06-19 12:11:26 -0500 + Commit: bce0897, github.com/apache/spark/pull/969 + + Minor fix + WangTao + 2014-06-18 23:24:57 -0700 + Commit: 67fca18, github.com/apache/spark/pull/1105 + + [SPARK-2187] Explain should not run the optimizer twice. + Reynold Xin + 2014-06-18 22:44:12 -0700 + Commit: 640c294, github.com/apache/spark/pull/1123 + + Squishing a typo bug before it causes real harm + Doris Xin + 2014-06-18 22:19:06 -0700 + Commit: 566f70f, github.com/apache/spark/pull/1125 + + [SPARK-2184][SQL] AddExchange isn't idempotent + Michael Armbrust + 2014-06-18 17:52:42 -0700 + Commit: 5ff75c7, github.com/apache/spark/pull/1122 + + Remove unicode operator from RDD.scala + Doris Xin + 2014-06-18 15:01:29 -0700 + Commit: 45a95f8, github.com/apache/spark/pull/1119 + + SPARK-2158 Clean up core/stdout file from FileAppenderSuite + Mark Hamstra + 2014-06-18 14:56:41 -0700 + Commit: 4cbeea8, github.com/apache/spark/pull/1100 + + [SPARK-1466] Raise exception if pyspark Gateway process doesn't start. + Kay Ousterhout + 2014-06-18 13:16:26 -0700 + Commit: 3870248, github.com/apache/spark/pull/383 + + Updated the comment for SPARK-2162. 
+ Reynold Xin + 2014-06-18 12:48:58 -0700 + Commit: dd96fcd, github.com/apache/spark/pull/1117 + + [SPARK-2162] Double check in doGetLocal to avoid read on removed block. + Raymond Liu + 2014-06-18 10:57:45 -0700 + Commit: 5ad5e34, github.com/apache/spark/pull/1103 + + [SPARK-2176][SQL] Extra unnecessary exchange operator in the result of an explain command + Yin Huai + 2014-06-18 10:51:32 -0700 + Commit: 587d320, github.com/apache/spark/pull/1116 + + [STREAMING] SPARK-2009 Key not found exception when slow receiver starts + Vadim Chekan + 2014-06-17 22:03:50 -0700 + Commit: 889f7b7, github.com/apache/spark/pull/961 + + Revert "SPARK-2038: rename "conf" parameters in the saveAsHadoop functions" + Patrick Wendell + 2014-06-17 19:34:17 -0700 + Commit: 9e4b4bd + + [SPARK-2060][SQL] Querying JSON Datasets with SQL and DSL in Spark SQL + Yin Huai + 2014-06-17 19:14:59 -0700 + Commit: d2f4f30, github.com/apache/spark/pull/999 + + HOTFIX: bug caused by #941 + Patrick Wendell + 2014-06-17 15:09:24 -0700 + Commit: b2ebf42, github.com/apache/spark/pull/1108 + + [SPARK-2147 / 2161] Show removed executors on the UI + Andrew Or + 2014-06-17 12:25:55 -0700 + Commit: a14807e, github.com/apache/spark/pull/1102 + + SPARK-2038: rename "conf" parameters in the saveAsHadoop functions + CodingCat + 2014-06-17 12:17:48 -0700 + Commit: 443f5e1, github.com/apache/spark/pull/1087 + + SPARK-2146. Fix takeOrdered doc + Sandy Ryza + 2014-06-17 12:03:22 -0700 + Commit: 2794990, github.com/apache/spark/pull/1086 + + SPARK-1063 Add .sortBy(f) method on RDD + Andrew Ash + 2014-06-17 11:47:48 -0700 + Commit: b92d16b, github.com/apache/spark/pull/369 + + [SPARK-2053][SQL] Add Catalyst expressions for CASE WHEN. 
+ Zongheng Yang + 2014-06-17 13:30:17 +0200 + Commit: e243c5f, github.com/apache/spark/pull/1055 + + [SPARK-2164][SQL] Allow Hive UDF on columns of type struct + Xi Liu + 2014-06-17 13:14:40 +0200 + Commit: f5a4049, github.com/apache/spark/pull/796 + + [SPARK-2144] ExecutorsPage reports incorrect # of RDD blocks + Andrew Or + 2014-06-17 01:28:22 -0700 + Commit: 09deb3e, github.com/apache/spark/pull/1080 + + SPARK-2035: Store call stack for stages, display it on the UI. + Daniel Darabos , Patrick Wendell + 2014-06-17 00:08:05 -0700 + Commit: 23a12ce, github.com/apache/spark/pull/981 + + SPARK-1990: added compatibility for python 2.6 for ssh_read command + Anant + 2014-06-16 23:42:27 -0700 + Commit: 8cd04c3, github.com/apache/spark/pull/941 + + [SPARK-2130] End-user friendly String repr for StorageLevel in Python + Kan Zhang + 2014-06-16 23:31:31 -0700 + Commit: d81c08b, github.com/apache/spark/pull/1096 + + MLlib documentation fix + Anatoli Fomenko + 2014-06-16 23:10:36 -0700 + Commit: 7afa912, github.com/apache/spark/pull/1098 + + Minor fix: made "EXPLAIN" output to play well with JDBC output format + Cheng Lian + 2014-06-16 16:42:17 -0700 + Commit: 237b96b, github.com/apache/spark/pull/1097 + + [SQL][SPARK-2094] Follow up of PR #1071 for Java API + Cheng Lian + 2014-06-16 21:30:29 +0200 + Commit: 273afcb, github.com/apache/spark/pull/1085 + + [SPARK-1930] The Container is running beyond physical memory limits, so as to be killed + witgo + 2014-06-16 14:27:31 -0500 + Commit: cdf2b04, github.com/apache/spark/pull/894 + + [SPARK-2010] Support for nested data in PySpark SQL + Kan Zhang + 2014-06-16 11:11:29 -0700 + Commit: 4fdb491, github.com/apache/spark/pull/1041 + + SPARK-2039: apply output dir existence checking for all output formats + CodingCat + 2014-06-15 23:47:58 -0700 + Commit: 716c88a, github.com/apache/spark/pull/1088 + + Updating docs to include missing information about reducers and clarify ... 
+ Ali Ghodsi + 2014-06-15 23:44:30 -0700 + Commit: 119b06a, github.com/apache/spark/pull/1089 + + SPARK-2148 Add link to requirements for custom equals() and hashcode() methods + Andrew Ash + 2014-06-15 23:32:55 -0700 + Commit: 9672ee0, github.com/apache/spark/pull/1092 + + SPARK-1999: StorageLevel in storage tab and RDD Storage Info never changes + CrazyJvm + 2014-06-15 23:23:26 -0700 + Commit: a63aa1a, github.com/apache/spark/pull/968 + + [SPARK-937] adding EXITED executor state and not relaunching cleanly exited executors + Kan Zhang + 2014-06-15 14:55:34 -0700 + Commit: ca5d9d4, github.com/apache/spark/pull/306 + + [SQL] Support transforming TreeNodes with Option children. + Michael Armbrust , Zongheng Yang + 2014-06-15 11:28:34 +0200 + Commit: 269fc62, github.com/apache/spark/pull/1074 + + [SPARK-1837] NumericRange should be partitioned in the same way as other... + Kan Zhang + 2014-06-14 14:31:28 -0700 + Commit: 7dd9fc6, github.com/apache/spark/pull/776 + + [SPARK-2013] Documentation for saveAsPickleFile and pickleFile in Python + Kan Zhang + 2014-06-14 13:22:30 -0700 + Commit: b52603b, github.com/apache/spark/pull/983 + + [SPARK-2079] Support batching when serializing SchemaRDD to Python + Kan Zhang + 2014-06-14 13:17:22 -0700 + Commit: 2550533, github.com/apache/spark/pull/1023 + + [Spark-2137][SQL] Timestamp UDFs broken + Yin Huai + 2014-06-13 23:28:57 -0700 + Commit: 8919685, github.com/apache/spark/pull/1081 + + Small correction in Streaming Programming Guide doc + akkomar + 2014-06-13 15:37:26 -0700 + Commit: edb1f0e, github.com/apache/spark/pull/1079 + + [SPARK-2094][SQL] "Exactly once" semantics for DDL and command statements + Cheng Lian + 2014-06-13 12:59:48 -0700 + Commit: ac96d96, github.com/apache/spark/pull/1071 + + [SPARK-1964][SQL] Add timestamp to HiveMetastoreTypes.toMetastoreType + Michael Armbrust + 2014-06-13 12:55:15 -0700 + Commit: 1c2fd01, github.com/apache/spark/pull/1061 + + Workaround in Spark for ConcurrentModification issue (JIRA 
Hadoop-10456, Spark-1097) + nravi + 2014-06-13 10:52:21 -0700 + Commit: 70c8116, github.com/apache/spark/pull/1000 + + [HOTFIX] add math3 version to pom + Xiangrui Meng + 2014-06-13 02:59:38 -0700 + Commit: b3736e3, github.com/apache/spark/pull/1075 + + [SPARK-2135][SQL] Use planner for in-memory scans + Michael Armbrust + 2014-06-12 23:09:41 -0700 + Commit: 13f8cfd, github.com/apache/spark/pull/1072 + + [SPARK-1516]Throw exception in yarn client instead of run system.exit directly. + John Zhao + 2014-06-12 21:39:00 -0700 + Commit: f95ac68, github.com/apache/spark/pull/490 + + [Minor] Fix style, formatting and naming in BlockManager etc. + Andrew Or + 2014-06-12 20:40:58 -0700 + Commit: 44daec5, github.com/apache/spark/pull/1058 + + SPARK-1939 Refactor takeSample method in RDD to use ScaSRS + Doris Xin , dorx , Xiangrui Meng + 2014-06-12 19:44:27 -0700 + Commit: 1de1d70, github.com/apache/spark/pull/916 + + document laziness of parallelize + Ariel Rabkin + 2014-06-12 17:51:33 -0700 + Commit: 0154587, github.com/apache/spark/pull/1070 + + SPARK-2085: [MLlib] Apply user-specific regularization instead of uniform regularization in ALS + Shuo Xiang + 2014-06-12 17:37:06 -0700 + Commit: a6e0afd, github.com/apache/spark/pull/1026 + + SPARK-1843: Replace assemble-deps with env variable. + Patrick Wendell + 2014-06-12 15:43:32 -0700 + Commit: 1c04652, github.com/apache/spark/pull/877 + + [SPARK-2080] Yarn: report HS URL in client mode, correct user in cluster mode. + Marcelo Vanzin + 2014-06-12 16:19:36 -0500 + Commit: ecde5b8, github.com/apache/spark/pull/1002 + + [SPARK-2088] fix NPE in toString + Doris Xin + 2014-06-12 12:53:07 -0700 + Commit: 83c226d, github.com/apache/spark/pull/1028 + + SPARK-554. Add aggregateByKey. 
+ Sandy Ryza + 2014-06-12 08:14:25 -0700 + Commit: ce92a9c, github.com/apache/spark/pull/705 + + fixed typo in docstring for min() + Jeff Thompson + 2014-06-12 08:10:51 -0700 + Commit: 43d53d5, github.com/apache/spark/pull/1065 + + Cleanup on Connection and ConnectionManager + Henry Saputra + 2014-06-11 23:17:51 -0700 + Commit: 4d8ae70, github.com/apache/spark/pull/1060 + + 'killFuture' is never used + Yadong + 2014-06-11 20:58:39 -0700 + Commit: e056320, github.com/apache/spark/pull/1052 + + [SPARK-2044] Pluggable interface for shuffles + Matei Zaharia + 2014-06-11 20:45:29 -0700 + Commit: 508fd37, github.com/apache/spark/pull/1009 + + [SPARK-1672][MLLIB] Separate user and product partitioning in ALS + Tor Myklebust , Xiangrui Meng + 2014-06-11 18:16:33 -0700 + Commit: d920335, github.com/apache/spark/pull/1014 + + [SPARK-2052] [SQL] Add optimization for CaseConversionExpression's. + Takuya UESHIN + 2014-06-11 17:58:35 -0700 + Commit: 9a2448d, github.com/apache/spark/pull/990 + + HOTFIX: Forgot to remove false change in previous commit + Patrick Wendell + 2014-06-11 15:55:41 -0700 + Commit: d45e0c6 + + HOTFIX: PySpark tests should be order insensitive. 
+ Patrick Wendell + 2014-06-11 15:54:41 -0700 + Commit: 14e6dc9, github.com/apache/spark/pull/1054 + + HOTFIX: A few PySpark tests were not actually run + Andrew Or + 2014-06-11 12:11:46 -0700 + Commit: fe78b8b, github.com/apache/spark/pull/1053 + + [SQL] Code Cleanup: Left Semi Hash Join + Daoyuan + 2014-06-11 12:08:28 -0700 + Commit: ce6deb1, github.com/apache/spark/pull/1049 + + [SPARK-2042] Prevent unnecessary shuffle triggered by take() + Sameer Agarwal + 2014-06-11 12:01:04 -0700 + Commit: 4107cce, github.com/apache/spark/pull/1048 + + SPARK-2113: awaitTermination() after stop() will hang in Spark Stremaing + Lars Albertsson + 2014-06-11 10:54:42 -0700 + Commit: 4d5c12a, github.com/apache/spark/pull/1001 + + [SPARK-2108] Mark SparkContext methods that return block information as developer API's + Prashant Sharma + 2014-06-11 10:49:34 -0700 + Commit: e508f59, github.com/apache/spark/pull/1047 + + [SPARK-2069] MIMA false positives + Prashant Sharma + 2014-06-11 10:47:06 -0700 + Commit: 5b754b4, github.com/apache/spark/pull/1021 + + SPARK-1639. Tidy up some Spark on YARN code + Sandy Ryza + 2014-06-11 07:57:28 -0500 + Commit: 2a4225d, github.com/apache/spark/pull/561 + + SPARK-2107: FilterPushdownSuite doesn't need Junit jar. + Qiuzhuang.Lian + 2014-06-11 00:36:06 -0700 + Commit: 6e11930, github.com/apache/spark/pull/1046 + + [SPARK-2091][MLLIB] use numpy.dot instead of ndarray.dot + Xiangrui Meng + 2014-06-11 00:22:40 -0700 + Commit: 0f1dc3a, github.com/apache/spark/pull/1035 + + [SPARK-1968][SQL] SQL/HiveQL command for caching/uncaching tables + Cheng Lian + 2014-06-11 00:06:50 -0700 + Commit: 0266a0c, github.com/apache/spark/pull/1038 + + [SPARK-2093] [SQL] NullPropagation should use exact type value. + Takuya UESHIN + 2014-06-10 23:13:48 -0700 + Commit: 0402bd7, github.com/apache/spark/pull/1034 + + HOTFIX: clear() configs in SQLConf-related unit tests. 
+ Zongheng Yang + 2014-06-10 21:59:01 -0700 + Commit: 601032f, github.com/apache/spark/pull/1040 + + [SPARK-2065] give launched instances names + Nicholas Chammas , nchammas + 2014-06-10 21:49:08 -0700 + Commit: a2052a4, github.com/apache/spark/pull/1043 + + Resolve scalatest warnings during build + witgo + 2014-06-10 20:24:05 -0700 + Commit: c48b622, github.com/apache/spark/pull/1032 + + [SPARK-1940] Enabling rolling of executor logs, and automatic cleanup of old executor logs + Tathagata Das + 2014-06-10 20:22:02 -0700 + Commit: 4823bf4, github.com/apache/spark/pull/895 + + [SPARK-1998] SparkFlumeEvent with body bigger than 1020 bytes are not re... + joyyoj + 2014-06-10 17:26:17 -0700 + Commit: 2966044, github.com/apache/spark/pull/951 + + [SQL] Add average overflow test case from #978 + egraldlo , Michael Armbrust + 2014-06-10 14:07:55 -0700 + Commit: 1abbde0, github.com/apache/spark/pull/1033 + + HOTFIX: Increase time limit for Bagel test + Ankur Dave + 2014-06-10 13:15:06 -0700 + Commit: 55a0e87, github.com/apache/spark/pull/1037 + + HOTFIX: Fix Python tests on Jenkins. + Patrick Wendell + 2014-06-10 13:13:17 -0700 + Commit: fb499be, github.com/apache/spark/pull/1036 + + [SPARK-2076][SQL] Pushdown the join filter & predication for outer join + Cheng Hao + 2014-06-10 12:59:52 -0700 + Commit: db0c038, github.com/apache/spark/pull/1015 + + [SPARK-1978] In some cases, spark-yarn does not automatically restart the failed container + witgo + 2014-06-10 10:34:57 -0500 + Commit: 884ca71, github.com/apache/spark/pull/921 + + Moved hiveOperators.scala to the right package folder + Cheng Lian + 2014-06-10 01:14:44 -0700 + Commit: a9a461c, github.com/apache/spark/pull/1029 + + [SPARK-1508][SQL] Add SQLConf to SQLContext. 
+ Zongheng Yang + 2014-06-10 00:49:09 -0700 + Commit: 08ed9ad, github.com/apache/spark/pull/956 + + SPARK-1416: PySpark support for SequenceFile and Hadoop InputFormats + Nick Pentreath + 2014-06-09 22:21:03 -0700 + Commit: f971d6c, github.com/apache/spark/pull/455 + + Make sure that empty string is filtered out when we get the secondary jars from conf + DB Tsai + 2014-06-09 22:18:50 -0700 + Commit: 6f2db8c, github.com/apache/spark/pull/1027 + + [SPARK-1704][SQL] Fully support EXPLAIN commands as SchemaRDD. + Zongheng Yang + 2014-06-09 16:47:44 -0700 + Commit: a9ec033, github.com/apache/spark/pull/1003 + + [SQL] Simple framework for debugging query execution + Michael Armbrust + 2014-06-09 14:24:19 -0700 + Commit: c6e041d, github.com/apache/spark/pull/1005 + + [SPARK-1522] : YARN ClientBase throws a NPE if there is no YARN Application CP + Bernardo Gomez Palacio + 2014-06-09 16:14:54 -0500 + Commit: e273447, github.com/apache/spark/pull/433 + + Added a TaskSetManager unit test. + Kay Ousterhout + 2014-06-09 13:13:53 -0700 + Commit: 6cf335d, github.com/apache/spark/pull/1024 + + [SPARK-1495][SQL]add support for left semi join + Daoyuan , Michael Armbrust , Daoyuan Wang + 2014-06-09 11:31:36 -0700 + Commit: 0cf6002, github.com/apache/spark/pull/837 + + SPARK-1944 Document --verbose in spark-shell -h + Andrew Ash + 2014-06-09 10:21:21 -0700 + Commit: 35630c8, github.com/apache/spark/pull/1020 + + [SPARK-1308] Add getNumPartitions to pyspark RDD + Syed Hashmi + 2014-06-09 00:08:40 -0700 + Commit: 6113ac1, github.com/apache/spark/pull/995 + + Grammar: read -> reads + Andrew Ash + 2014-06-08 23:20:10 -0700 + Commit: 32ee9f0, github.com/apache/spark/pull/1016 + + [SPARK-2067] use relative path for Spark logo in UI + Neville Li + 2014-06-08 23:18:27 -0700 + Commit: 15ddbef, github.com/apache/spark/pull/1006 + + SPARK-1628 follow up: Improve RangePartitioner's documentation. 
+ Reynold Xin + 2014-06-08 18:39:57 -0700 + Commit: 219dc00, github.com/apache/spark/pull/1012 + + Update run-example + maji2014 + 2014-06-08 15:14:27 -0700 + Commit: e9261d0, github.com/apache/spark/pull/1011 + + SPARK-1628: Add missing hashCode methods in Partitioner subclasses + zsxwing + 2014-06-08 14:18:52 -0700 + Commit: a71c6d1, github.com/apache/spark/pull/549 + + SPARK-1898: In deploy.yarn.Client, use YarnClient not YarnClientImpl + Colin Patrick McCabe + 2014-06-08 12:27:34 -0700 + Commit: ee96e94, github.com/apache/spark/pull/850 + + SPARK-2026: Maven Hadoop Profiles Should Set The Hadoop Version + Bernardo Gomez Palacio + 2014-06-08 01:24:52 -0700 + Commit: a338834, github.com/apache/spark/pull/998 + + SPARK-2056 Set RDD name to input path + Neville Li + 2014-06-07 16:22:26 -0700 + Commit: 7b877b2, github.com/apache/spark/pull/992 + + HOTFIX: Support empty body in merge script + Patrick Wendell + 2014-06-07 16:16:37 -0700 + Commit: 3ace10d, github.com/apache/spark/pull/1007 + + [SPARK-1994][SQL] Weird data corruption bug when running Spark SQL on data in HDFS + Michael Armbrust + 2014-06-07 14:20:33 -0700 + Commit: a6c72ab, github.com/apache/spark/pull/1004 + + [SPARK-1841]: update scalatest to version 2.1.5 + witgo + 2014-06-06 11:45:21 -0700 + Commit: 41c4a33, github.com/apache/spark/pull/713 + + [SPARK-2050 - 2][SQL] DIV and BETWEEN should not be case sensitive. + Michael Armbrust + 2014-06-06 11:31:37 -0700 + Commit: 8d21056, github.com/apache/spark/pull/994 + + [SPARK-1552] Fix type comparison bug in {map,outerJoin}Vertices + Ankur Dave + 2014-06-05 23:33:12 -0700 + Commit: 8d85359, github.com/apache/spark/pull/967 + + [SPARK-2050][SQL] LIKE, RLIKE and IN in HQL should not be case sensitive. 
+ Michael Armbrust + 2014-06-05 23:20:59 -0700 + Commit: 41db44c, github.com/apache/spark/pull/989 + + SPARK-2043: ExternalAppendOnlyMap doesn't always find matching keys + Matei Zaharia + 2014-06-05 23:01:48 -0700 + Commit: b45c13e, github.com/apache/spark/pull/986 + + [SPARK-2025] Unpersist edges of previous graph in Pregel + Ankur Dave + 2014-06-05 17:45:38 -0700 + Commit: 9bad0b7, github.com/apache/spark/pull/972 + + Use pluggable clock in DAGScheduler #SPARK-2031 + CrazyJvm + 2014-06-05 17:44:46 -0700 + Commit: 3d3f8c8, github.com/apache/spark/pull/976 + + [SPARK-2041][SQL] Correctly analyze queries where columnName == tableName. + Michael Armbrust + 2014-06-05 17:42:08 -0700 + Commit: c7a183b, github.com/apache/spark/pull/985 + + Remove compile-scoped junit dependency. + Marcelo Vanzin + 2014-06-05 13:13:33 -0700 + Commit: 668cb1d, github.com/apache/spark/pull/794 + + sbt 0.13.X should be using sbt-assembly 0.11.X + Kalpit Shah + 2014-06-05 13:07:26 -0700 + Commit: 5473aa7, github.com/apache/spark/pull/555 + + HOTFIX: Remove generated-mima-excludes file after running MIMA. + Patrick Wendell + 2014-06-05 13:06:46 -0700 + Commit: f6143f1, github.com/apache/spark/pull/971 + + [SPARK-2036] [SQL] CaseConversionExpression should check if the evaluated value is null. + Takuya UESHIN + 2014-06-05 12:00:31 -0700 + Commit: e4c11ee, github.com/apache/spark/pull/982 + + SPARK-1677: allow user to disable output dir existence checking + CodingCat + 2014-06-05 11:39:35 -0700 + Commit: 89cdbb0, github.com/apache/spark/pull/947 + + [SPARK-2029] Bump pom.xml version number of master branch to 1.1.0-SNAPSHOT. + Takuya UESHIN + 2014-06-05 11:27:33 -0700 + Commit: 7c16029, github.com/apache/spark/pull/974 + + Fix issue in ReplSuite with hadoop-provided profile. 
+ Marcelo Vanzin + 2014-06-04 22:56:49 -0700 + Commit: b77c19b, github.com/apache/spark/pull/781 + + Minor: Fix documentation error from apache/spark#946 + Ankur Dave + 2014-06-04 16:45:53 -0700 + Commit: abea2d4, github.com/apache/spark/pull/970 + + SPARK-1790: Update EC2 scripts to support r3 instance types + Varakhedi Sujeet + 2014-06-04 16:01:56 -0700 + Commit: 11ded3f, github.com/apache/spark/pull/960 + + SPARK-1518: FileLogger: Fix compile against Hadoop trunk + Colin McCabe + 2014-06-04 15:56:29 -0700 + Commit: 1765c8d, github.com/apache/spark/pull/898 + + [SPARK-1752][MLLIB] Standardize text format for vectors and labeled points + Xiangrui Meng + 2014-06-04 12:56:56 -0700 + Commit: 189df16, github.com/apache/spark/pull/685 + + SPARK-1973. Add randomSplit to JavaRDD (with tests, and tidy Java tests) + Sean Owen , Xiangrui Meng + 2014-06-04 11:27:08 -0700 + Commit: d341b17, github.com/apache/spark/pull/919 + + [MLLIB] set RDD names in ALS + Neville Li + 2014-06-04 01:51:34 -0700 + Commit: b8d2580, github.com/apache/spark/pull/966 + + [SPARK-1817] RDD.zip() should verify partition sizes for each partition + Kan Zhang + 2014-06-03 22:47:18 -0700 + Commit: c402a4a, github.com/apache/spark/pull/944 + + SPARK-1806 (addendum) Use non-deprecated methods in Mesos 0.18 + Sean Owen + 2014-06-03 22:37:20 -0700 + Commit: 4ca0625, github.com/apache/spark/pull/920 + + Update spark-ec2 scripts for 1.0.0 on master + Aaron Davidson + 2014-06-03 22:33:04 -0700 + Commit: ab7c62d, github.com/apache/spark/pull/938 + + Enable repartitioning of graph over different number of partitions + Joseph E. Gonzalez + 2014-06-03 20:49:14 -0700 + Commit: 5284ca7, github.com/apache/spark/pull/719 + + use env default python in merge_spark_pr.py + Xiangrui Meng + 2014-06-03 18:53:13 -0700 + Commit: e8d93ee, github.com/apache/spark/pull/965 + + SPARK-1941: Update streamlib to 2.7.0 and use HyperLogLogPlus instead of HyperLogLog. 
+ Reynold Xin + 2014-06-03 18:37:40 -0700 + Commit: 1faef14, github.com/apache/spark/pull/897 + + [SPARK-1161] Add saveAsPickleFile and SparkContext.pickleFile in Python + Kan Zhang + 2014-06-03 18:18:25 -0700 + Commit: 21e40ed, github.com/apache/spark/pull/755 + + Fixed a typo + DB Tsai + 2014-06-03 18:10:58 -0700 + Commit: f4dd665, github.com/apache/spark/pull/959 + + [SPARK-1991] Support custom storage levels for vertices and edges + Ankur Dave + 2014-06-03 14:54:26 -0700 + Commit: b1feb60, github.com/apache/spark/pull/946 + + Synthetic GraphX Benchmark + Joseph E. Gonzalez , Ankur Dave + 2014-06-03 14:14:48 -0700 + Commit: 894ecde, github.com/apache/spark/pull/720 + + fix java.lang.ClassCastException + baishuo(白硕) + 2014-06-03 13:39:47 -0700 + Commit: aa41a52, github.com/apache/spark/pull/949 + + [SPARK-1468] Modify the partition function used by partitionBy. + Erik Selin + 2014-06-03 13:31:16 -0700 + Commit: 8edc9d0, github.com/apache/spark/pull/371 + + Add support for Pivotal HD in the Maven build: SPARK-1992 + tzolov + 2014-06-03 13:26:29 -0700 + Commit: b1f2853, github.com/apache/spark/pull/942 + + [SPARK-1912] fix compress memory issue during reduce + Wenchen Fan(Cloud) + 2014-06-03 13:18:20 -0700 + Commit: 45e9bc8, github.com/apache/spark/pull/860 + + SPARK-2001 : Remove docs/spark-debugger.md from master + Henry Saputra + 2014-06-03 13:03:51 -0700 + Commit: 6c044ed, github.com/apache/spark/pull/953 + + [SPARK-1942] Stop clearing spark.driver.port in unit tests + Syed Hashmi , CodingCat + 2014-06-03 12:04:47 -0700 + Commit: 7782a30, github.com/apache/spark/pull/943 + + Avoid dynamic dispatching when unwrapping Hive data. 
+ Cheng Lian + 2014-06-02 19:20:23 -0700 + Commit: 862283e, github.com/apache/spark/pull/935 + + [SPARK-1995][SQL] system function upper and lower can be supported + egraldlo + 2014-06-02 18:02:57 -0700 + Commit: ec8be27, github.com/apache/spark/pull/936 + + [SPARK-1958] Calling .collect() on a SchemaRDD should call executeCollect() on the underlying query plan. + Cheng Lian + 2014-06-02 12:09:43 -0700 + Commit: d000ca9, github.com/apache/spark/pull/939 + + [SPARK-1553] Alternating nonnegative least-squares + Tor Myklebust + 2014-06-02 11:48:09 -0700 + Commit: 9a5d482, github.com/apache/spark/pull/460 + + Add landmark-based Shortest Path algorithm to graphx.lib + Ankur Dave , Andres Perez + 2014-06-02 00:00:24 -0700 + Commit: 9535f40, github.com/apache/spark/pull/933 + + Better explanation for how to use MIMA excludes. + Patrick Wendell + 2014-06-01 17:27:05 -0700 + Commit: d17d221, github.com/apache/spark/pull/937 + + Made spark_ec2.py PEP8 compliant. + Reynold Xin + 2014-06-01 15:39:04 -0700 + Commit: eea3aab, github.com/apache/spark/pull/891 + + updated java code blocks in spark SQL guide such that ctx will refer to ... + Yadid Ayzenberg + 2014-05-31 19:44:13 -0700 + Commit: 366c0c4, github.com/apache/spark/pull/932 + + SPARK-1917: fix PySpark import of scipy.special functions + Uri Laserson + 2014-05-31 14:59:09 -0700 + Commit: 5e98967, github.com/apache/spark/pull/866 + + Improve maven plugin configuration + witgo + 2014-05-31 14:36:27 -0700 + Commit: d8c005d, github.com/apache/spark/pull/786 + + SPARK-1839: PySpark RDD#take() shouldn't always read from driver + Aaron Davidson + 2014-05-31 13:04:57 -0700 + Commit: 9909efc, github.com/apache/spark/pull/922 + + Super minor: Close inputStream in SparkSubmitArguments + Aaron Davidson + 2014-05-31 12:36:58 -0700 + Commit: 7d52777, github.com/apache/spark/pull/914 + + [SQL] SPARK-1964 Add timestamp to hive metastore type parser. 
+ Michael Armbrust + 2014-05-31 12:34:22 -0700 + Commit: 1a0da0e, github.com/apache/spark/pull/913 + + Optionally include Hive as a dependency of the REPL. + Michael Armbrust + 2014-05-31 12:24:35 -0700 + Commit: 7463cd2, github.com/apache/spark/pull/801 + + [SPARK-1947] [SQL] Child of SumDistinct or Average should be widened to prevent overflows the same as Sum. + Takuya UESHIN + 2014-05-31 11:30:03 -0700 + Commit: 3ce8149, github.com/apache/spark/pull/902 + + correct tiny comment error + Chen Chao + 2014-05-31 00:06:49 -0700 + Commit: 9ecc40d, github.com/apache/spark/pull/928 + + [SPARK-1959] String "NULL" shouldn't be interpreted as null value + Cheng Lian + 2014-05-30 22:13:11 -0700 + Commit: cf98960, github.com/apache/spark/pull/909 + + SPARK-1976: fix the misleading part in streaming docs + CodingCat + 2014-05-30 22:06:08 -0700 + Commit: 41bfdda, github.com/apache/spark/pull/924 + + updated link to mailing list + nchammas + 2014-05-30 22:04:57 -0700 + Commit: 23ae366, github.com/apache/spark/pull/923 + + Typo: and -> an + Andrew Ash + 2014-05-30 22:02:04 -0700 + Commit: 9c1f204, github.com/apache/spark/pull/927 + + [SPARK-1901] worker should make sure executor has exited before updating executor's info + Zhen Peng + 2014-05-30 10:11:02 -0700 + Commit: ff562b2, github.com/apache/spark/pull/854 + + [SPARK-1971] Update MIMA to compare against Spark 1.0.0 + Prashant Sharma + 2014-05-30 01:13:51 -0700 + Commit: 79fa8fd, github.com/apache/spark/pull/910 + + [SPARK-1566] consolidate programming guide, and general doc updates + Matei Zaharia + 2014-05-30 00:34:33 -0700 + Commit: c8bf413, github.com/apache/spark/pull/896 + + [SPARK-1820] Make GenerateMimaIgnore @DeveloperApi annotation aware. 
+ Prashant Sharma , nikhil7sh + 2014-05-29 23:20:20 -0700 + Commit: eeee978, github.com/apache/spark/pull/904 + + initial version of LPA + Ankur Dave , haroldsultan , Harold Sultan + 2014-05-29 15:39:25 -0700 + Commit: b7e28fa, github.com/apache/spark/pull/905 + + [SPARK-1368][SQL] Optimized HiveTableScan + Cheng Lian + 2014-05-29 15:24:03 -0700 + Commit: 8f7141f, github.com/apache/spark/pull/758 + + SPARK-1935: Explicitly add commons-codec 1.5 as a dependency. + Yin Huai + 2014-05-29 09:07:39 -0700 + Commit: 60b89fe, github.com/apache/spark/pull/889 + + Added doctest and method description in context.py + Jyotiska NK + 2014-05-28 23:08:39 -0700 + Commit: 9cff1dd, github.com/apache/spark/pull/187 + + [SPARK-1712]: TaskDescription instance is too big causes Spark to hang + witgo + 2014-05-28 15:57:05 -0700 + Commit: 4dbb27b, github.com/apache/spark/pull/694 + + Spark 1916 + David Lemieux + 2014-05-28 15:50:35 -0700 + Commit: 4312cf0, github.com/apache/spark/pull/865 + + Organize configuration docs + Patrick Wendell + 2014-05-28 15:49:54 -0700 + Commit: 7801d44, github.com/apache/spark/pull/880 + + Fix doc about NetworkWordCount/JavaNetworkWordCount usage of spark streaming + jmu + 2014-05-27 22:41:47 -0700 + Commit: 82eadc3, github.com/apache/spark/pull/826 + + [SPARK-1938] [SQL] ApproxCountDistinctMergeFunction should return Int value. + Takuya UESHIN + 2014-05-27 22:17:50 -0700 + Commit: 9df8683, github.com/apache/spark/pull/893 + + [SQL] SPARK-1922 + LY Lai + 2014-05-27 16:08:38 -0700 + Commit: 0682567, github.com/apache/spark/pull/873 + + [SPARK-1915] [SQL] AverageFunction should not count if the evaluated value is null. + Takuya UESHIN + 2014-05-27 14:55:23 -0700 + Commit: 3b0baba, github.com/apache/spark/pull/862 + + [SPARK-1926] [SQL] Nullability of Max/Min/First should be true. 
+ Takuya UESHIN + 2014-05-27 14:53:57 -0700 + Commit: d1375a2, github.com/apache/spark/pull/881 + + bugfix worker DriverStateChanged state should match DriverState.FAILED + lianhuiwang + 2014-05-27 11:53:38 -0700 + Commit: 95e4c9c, github.com/apache/spark/pull/864 + + SPARK-1932: Fix race conditions in onReceiveCallback and cachedPeers + zsxwing + 2014-05-26 23:17:39 -0700 + Commit: 549830b, github.com/apache/spark/pull/887 + + SPARK-1933: Throw a more meaningful exception when a directory is passed to addJar/addFile. + Reynold Xin + 2014-05-26 22:05:23 -0700 + Commit: 90e281b, github.com/apache/spark/pull/888 + + Updated dev Python scripts to make them PEP8 compliant. + Reynold Xin + 2014-05-26 21:40:52 -0700 + Commit: 9ed3719, github.com/apache/spark/pull/875 + + Fixed the error message for OutOfMemoryError in DAGScheduler. + Reynold Xin + 2014-05-26 21:31:27 -0700 + Commit: ef690e1 + + SPARK-1929 DAGScheduler suspended by local task OOM + Zhen Peng + 2014-05-26 21:30:25 -0700 + Commit: 8d271c9, github.com/apache/spark/pull/883 + + [SPARK-1931] Reconstruct routing tables in Graph.partitionBy + Ankur Dave + 2014-05-26 16:10:22 -0700 + Commit: 56c771c, github.com/apache/spark/pull/885 + + SPARK-1925: Replace '&' with '&&' + zsxwing + 2014-05-26 14:34:58 -0700 + Commit: cb7fe50, github.com/apache/spark/pull/879 + + Fix scalastyle warnings in yarn alpha + witgo + 2014-05-26 13:16:35 -0700 + Commit: bee6c4f, github.com/apache/spark/pull/884 + + [SPARK-1914] [SQL] Simplify CountFunction not to traverse to evaluate all child expressions. 
+ Takuya UESHIN + 2014-05-26 00:17:20 -0700 + Commit: d6395d8, github.com/apache/spark/pull/861 + + HOTFIX: Add no-arg SparkContext constructor in Java + Patrick Wendell + 2014-05-25 20:13:32 -0700 + Commit: b6d22af, github.com/apache/spark/pull/878 + + [SQL] Minor: Introduce SchemaRDD#aggregate() for simple aggregations + Aaron Davidson + 2014-05-25 18:37:44 -0700 + Commit: c3576ff, github.com/apache/spark/pull/874 + + SPARK-1903 Document Spark's network connections + Andrew Ash + 2014-05-25 17:15:47 -0700 + Commit: 0659529, github.com/apache/spark/pull/856 + + Fix PEP8 violations in Python mllib. + Reynold Xin + 2014-05-25 17:15:01 -0700 + Commit: d33d3c6, github.com/apache/spark/pull/871 + + Python docstring update for sql.py. + Reynold Xin + 2014-05-25 16:04:17 -0700 + Commit: 14f0358, github.com/apache/spark/pull/869 + + Fix PEP8 violations in examples/src/main/python. + Reynold Xin + 2014-05-25 14:48:27 -0700 + Commit: d79c2b2, github.com/apache/spark/pull/870 + + Added license header for tox.ini. + Reynold Xin + 2014-05-25 01:47:08 -0700 + Commit: 55fddf9 + + SPARK-1822: Some minor cleanup work on SchemaRDD.count() + Reynold Xin + 2014-05-25 01:44:49 -0700 + Commit: d66642e, github.com/apache/spark/pull/868 + + Added PEP8 style configuration file. 
+ Reynold Xin + 2014-05-25 01:32:15 -0700 + Commit: 5c7faec, github.com/apache/spark/pull/872 + + [SPARK-1822] SchemaRDD.count() should use query optimizer + Kan Zhang + 2014-05-25 00:06:42 -0700 + Commit: 6052db9, github.com/apache/spark/pull/841 + + spark-submit: add exec at the end of the script + Colin Patrick Mccabe + 2014-05-24 22:39:27 -0700 + Commit: 6e9fb63, github.com/apache/spark/pull/858 + + [SPARK-1913][SQL] Bug fix: column pruning error in Parquet support + Cheng Lian + 2014-05-24 20:42:01 -0700 + Commit: 5afe6af, github.com/apache/spark/pull/863 + + [SPARK-1886] check executor id existence when executor exit + Zhen Peng + 2014-05-24 20:40:19 -0700 + Commit: 4e4831b, github.com/apache/spark/pull/827 + + SPARK-1911: Emphasize that Spark jars should be built with Java 6. + Patrick Wendell + 2014-05-24 18:27:00 -0700 + Commit: 75a0327, github.com/apache/spark/pull/859 + + [SPARK-1900 / 1918] PySpark on YARN is broken + Andrew Or + 2014-05-24 18:01:49 -0700 + Commit: 5081a0a, github.com/apache/spark/pull/853 + + Update LBFGSSuite.scala + baishuo(白硕) + 2014-05-23 13:02:40 -0700 + Commit: a08262d, github.com/apache/spark/pull/815 + + Updated scripts for auditing releases + Tathagata Das + 2014-05-22 20:48:55 -0700 + Commit: b2bdd0e, github.com/apache/spark/pull/844 + + [SPARK-1896] Respect spark.master (and --master) before MASTER in spark-shell + Andrew Or + 2014-05-22 20:32:27 -0700 + Commit: cce7745, github.com/apache/spark/pull/846 + + [SPARK-1897] Respect spark.jars (and --jars) in spark-shell + Andrew Or + 2014-05-22 20:25:41 -0700 + Commit: 8edbee7, github.com/apache/spark/pull/849 + + Fix UISuite unit test that fails under Jenkins contention + Aaron Davidson + 2014-05-22 15:11:05 -0700 + Commit: f9f5fd5, github.com/apache/spark/pull/857 + + [SPARK-1870] Make spark-submit --jars work in yarn-cluster mode. 
+ Xiangrui Meng + 2014-05-22 01:52:50 -0700 + Commit: dba3140, github.com/apache/spark/pull/848 + + Configuration documentation updates + Reynold Xin + 2014-05-21 18:49:12 -0700 + Commit: 2a948e7, github.com/apache/spark/pull/851 + + [SPARK-1889] [SQL] Apply splitConjunctivePredicates to join condition while finding join ke... + Takuya UESHIN + 2014-05-21 15:37:47 -0700 + Commit: bb88875, github.com/apache/spark/pull/836 + + [SPARK-1519] Support minPartitions param of wholeTextFiles() in PySpark + Kan Zhang + 2014-05-21 13:26:53 -0700 + Commit: f18fd05, github.com/apache/spark/pull/697 + + [Typo] Stoped -> Stopped + Andrew Or + 2014-05-21 11:59:05 -0700 + Commit: ba5d4a9, github.com/apache/spark/pull/847 + + [Minor] Move JdbcRDDSuite to the correct package + Andrew Or + 2014-05-21 01:25:10 -0700 + Commit: 7c79ef7, github.com/apache/spark/pull/839 + + [Docs] Correct example of creating a new SparkConf + Andrew Or + 2014-05-21 01:23:34 -0700 + Commit: 1014668, github.com/apache/spark/pull/842 + + [SPARK-1250] Fixed misleading comments in bin/pyspark, bin/spark-class + Sumedh Mungee + 2014-05-21 01:22:25 -0700 + Commit: 6e33738, github.com/apache/spark/pull/843 + + [Hotfix] Blacklisted flaky HiveCompatibility test + Tathagata Das + 2014-05-20 10:27:12 -0700 + Commit: 7f0cfe4, github.com/apache/spark/pull/838 + + [Spark 1877] ClassNotFoundException when loading RDD with serialized objects + Tathagata Das , Ghidireac + 2014-05-19 22:36:24 -0700 + Commit: 52eb54d, github.com/apache/spark/pull/835 + + [SPARK-1874][MLLIB] Clean up MLlib sample data + Xiangrui Meng + 2014-05-19 21:29:33 -0700 + Commit: bcb9dce, github.com/apache/spark/pull/833 + + SPARK-1689: Spark application should die when removed by Master + Aaron Davidson + 2014-05-19 20:55:26 -0700 + Commit: b0ce22e, github.com/apache/spark/pull/832 + + [SPARK-1875]NoClassDefFoundError: StringUtils when building with hadoop 1.x and hive + witgo + 2014-05-19 19:40:29 -0700 + Commit: 6a2c5c6, 
github.com/apache/spark/pull/824 + + SPARK-1879. Increase MaxPermSize since some of our builds have many classes + Matei Zaharia + 2014-05-19 18:42:28 -0700 + Commit: 5af99d7, github.com/apache/spark/pull/823 + + SPARK-1878: Fix the incorrect initialization order + zsxwing + 2014-05-19 16:41:31 -0700 + Commit: 1811ba8, github.com/apache/spark/pull/822 + + [SPARK-1876] Windows fixes to deal with latest distribution layout changes + Matei Zaharia + 2014-05-19 15:02:35 -0700 + Commit: 7b70a70, github.com/apache/spark/pull/819 + + [WIP][SPARK-1871][MLLIB] Improve MLlib guide for v1.0 + Xiangrui Meng + 2014-05-18 17:00:57 -0700 + Commit: df0aa83, github.com/apache/spark/pull/816 + + SPARK-1873: Add README.md file when making distributions + Patrick Wendell + 2014-05-18 16:51:53 -0700 + Commit: 4ce4793, github.com/apache/spark/pull/818 + + Fix spark-submit path in spark-shell & pyspark + Neville Li + 2014-05-18 13:31:23 -0700 + Commit: ebcd2d6, github.com/apache/spark/pull/812 + + Make deprecation warning less severe + Patrick Wendell + 2014-05-16 22:58:47 -0700 + Commit: 442808a, github.com/apache/spark/pull/810 + + [SPARK-1824] Remove <master> from Python examples + Andrew Or + 2014-05-16 22:36:23 -0700 + Commit: cf6cbe9, github.com/apache/spark/pull/802 + + [SPARK-1808] Route bin/pyspark through Spark submit + Andrew Or + 2014-05-16 22:34:38 -0700 + Commit: 4b8ec6f, github.com/apache/spark/pull/799 + + Version bump of spark-ec2 scripts + Patrick Wendell + 2014-05-16 21:42:14 -0700 + Commit: c0ab85d, github.com/apache/spark/pull/809 + + SPARK-1864 Look in spark conf instead of system properties when propagating configuration to executors. 
+ Michael Armbrust + 2014-05-16 20:25:10 -0700 + Commit: a80a6a1, github.com/apache/spark/pull/808 + + Tweaks to Mesos docs + Matei Zaharia + 2014-05-16 17:35:05 -0700 + Commit: fed6303, github.com/apache/spark/pull/806 + + SPARK-1487 [SQL] Support record filtering via predicate pushdown in Parquet + Andre Schumacher + 2014-05-16 13:41:41 -0700 + Commit: 40d6acd, github.com/apache/spark/pull/511 + + [SQL] Implement between in hql + Michael Armbrust + 2014-05-16 11:47:00 -0700 + Commit: 032d663, github.com/apache/spark/pull/804 + + bugfix: overflow of graphx Edge compare function + Zhen Peng + 2014-05-16 11:37:18 -0700 + Commit: fa6de40, github.com/apache/spark/pull/769 + + HOTFIX: Duplication of hbase version + Patrick Wendell + 2014-05-15 23:33:27 -0700 + Commit: e304eb9 + + SPARK-1862: Support for MapR in the Maven build. + Patrick Wendell + 2014-05-15 23:31:43 -0700 + Commit: 17702e2, github.com/apache/spark/pull/803 + + [Spark-1461] Deferred Expression Evaluation (short-circuit evaluation) + Cheng Hao + 2014-05-15 22:12:34 -0700 + Commit: a20fea9, github.com/apache/spark/pull/446 + + SPARK-1860: Do not cleanup application work/ directories by default + Aaron Davidson + 2014-05-15 21:37:58 -0700 + Commit: bb98eca, github.com/apache/spark/pull/800 + + Typos in Spark + Huajian Mao + 2014-05-15 18:20:16 -0700 + Commit: 94c5139, github.com/apache/spark/pull/798 + + Fixes a misplaced comment. + Prashant Sharma + 2014-05-15 16:58:37 -0700 + Commit: e1e3416, github.com/apache/spark/pull/788 + + [SQL] Fix tiny/small ints from HiveMetastore. + Michael Armbrust + 2014-05-15 16:50:42 -0700 + Commit: a4aafe5, github.com/apache/spark/pull/797 + + SPARK-1803 Replaced colon in filenames with a dash + Stevo Slavić , Stevo Slavic + 2014-05-15 16:44:14 -0700 + Commit: e66e31b, github.com/apache/spark/pull/739 + + SPARK-1851. Upgrade Avro dependency to 1.7.6 so Spark can read Avro file... 
+ Sandy Ryza + 2014-05-15 16:35:39 -0700 + Commit: 08e7606, github.com/apache/spark/pull/795 + + [SPARK-1741][MLLIB] add predict(JavaRDD) to RegressionModel, ClassificationModel, and KMeans + Xiangrui Meng + 2014-05-15 11:59:59 -0700 + Commit: d52761d, github.com/apache/spark/pull/670 + + [SPARK-1819] [SQL] Fix GetField.nullable. + Takuya UESHIN + 2014-05-15 11:21:33 -0700 + Commit: 94c9d6f, github.com/apache/spark/pull/757 + + [SPARK-1845] [SQL] Use AllScalaRegistrar for SparkSqlSerializer to register serializers of ... + Takuya UESHIN + 2014-05-15 11:20:21 -0700 + Commit: db8cc6f, github.com/apache/spark/pull/790 + + SPARK-1846 Ignore logs directory in RAT checks + Andrew Ash + 2014-05-15 11:05:39 -0700 + Commit: 3abe2b7, github.com/apache/spark/pull/793 + + HOTFIX: Don't build Javadoc in Maven when creating releases. + Patrick Wendell + 2014-05-14 23:48:03 -0700 + Commit: 514157f + + fix different versions of commons-lang dependency and apache/spark#746 addendum + witgo + 2014-05-14 22:26:26 -0700 + Commit: bae07e3, github.com/apache/spark/pull/754 + + Package docs + Prashant Sharma , Patrick Wendell + 2014-05-14 22:24:41 -0700 + Commit: 4632427, github.com/apache/spark/pull/785 + + Documentation: Encourage use of reduceByKey instead of groupByKey. 
+ Patrick Wendell + 2014-05-14 22:24:04 -0700 + Commit: 21570b4, github.com/apache/spark/pull/784 + + Add language tabs and Python version to interactive part of quick-start + Matei Zaharia + 2014-05-14 21:45:20 -0700 + Commit: f10de04, github.com/apache/spark/pull/782 + + [SPARK-1840] SparkListenerBus prints out scary error message when terminated normally + Tathagata Das + 2014-05-14 21:13:41 -0700 + Commit: ad4e60e, github.com/apache/spark/pull/783 + + default task number misleading in several places + Chen Chao + 2014-05-14 18:20:20 -0700 + Commit: 2f63995, github.com/apache/spark/pull/766 + + [SPARK-1826] fix the head notation of package object dsl + wangfei + 2014-05-14 17:59:11 -0700 + Commit: 44165fc, github.com/apache/spark/pull/765 + + [Typo] propertes -> properties + andrewor14 + 2014-05-14 17:54:53 -0700 + Commit: 9ad096d, github.com/apache/spark/pull/780 + + [SPARK-1696][MLLIB] use alpha in dense dspr + Xiangrui Meng + 2014-05-14 17:18:30 -0700 + Commit: e3d72a7, github.com/apache/spark/pull/778 + + String interpolation + some other small changes + Jacek Laskowski + 2014-05-14 15:45:52 -0700 + Commit: 601e371, github.com/apache/spark/pull/748 + + [FIX] do not load defaults when testing SparkConf in pyspark + Xiangrui Meng + 2014-05-14 14:57:17 -0700 + Commit: 94c6c06, github.com/apache/spark/pull/775 + + SPARK-1833 - Have an empty SparkContext constructor. 
+ Patrick Wendell + 2014-05-14 12:53:30 -0700 + Commit: 65533c7, github.com/apache/spark/pull/774 + + SPARK-1829 Sub-second durations shouldn't round to "0 s" + Andrew Ash + 2014-05-14 12:01:14 -0700 + Commit: a3315d7, github.com/apache/spark/pull/768 + + Fix: sbt test throw an java.lang.OutOfMemoryError: PermGen space + witgo + 2014-05-14 11:19:26 -0700 + Commit: fde82c1, github.com/apache/spark/pull/773 + + [SPARK-1620] Handle uncaught exceptions in function run by Akka scheduler + Mark Hamstra + 2014-05-14 10:07:25 -0700 + Commit: 17f3075, github.com/apache/spark/pull/622 + + SPARK-1828: Created forked version of hive-exec that doesn't bundle other dependencies + Patrick Wendell + 2014-05-14 09:51:01 -0700 + Commit: d58cb33, github.com/apache/spark/pull/767 + + SPARK-1818 Freshen Mesos documentation + Andrew Ash + 2014-05-14 09:45:33 -0700 + Commit: d1d41cc, github.com/apache/spark/pull/756 + + SPARK-1827. LICENSE and NOTICE files need a refresh to contain transitive dependency info + Sean Owen + 2014-05-14 09:38:33 -0700 + Commit: 2e5a7cd, github.com/apache/spark/pull/770 + + Fixed streaming examples docs to use run-example instead of spark-submit + Tathagata Das + 2014-05-14 04:17:32 -0700 + Commit: 68f28da, github.com/apache/spark/pull/722 + + [SPARK-1769] Executor loss causes NPE race condition + Andrew Or + 2014-05-14 00:54:33 -0700 + Commit: 69f7502, github.com/apache/spark/pull/762 + + Fix dep exclusion: avro-ipc, not avro, depends on netty. + Marcelo Vanzin + 2014-05-14 00:37:57 -0700 + Commit: 54ae832, github.com/apache/spark/pull/763 + + SPARK-1801. expose InterruptibleIterator and TaskKilledException in deve... + Koert Kuipers + 2014-05-14 00:10:12 -0700 + Commit: b22952f, github.com/apache/spark/pull/764 + + [SQL] Improve column pruning. 
+ Michael Armbrust + 2014-05-13 23:27:22 -0700 + Commit: 6ce0884, github.com/apache/spark/pull/729 + + Revert "[SPARK-1784] Add a new partitioner to allow specifying # of keys per partition" + Patrick Wendell + 2014-05-13 23:24:51 -0700 + Commit: 7bb9a52 + + Implement ApproximateCountDistinct for SparkSql + larvaboy + 2014-05-13 21:26:08 -0700 + Commit: c33b8dc, github.com/apache/spark/pull/737 + + [SPARK-1784] Add a new partitioner to allow specifying # of keys per partition + Syed Hashmi + 2014-05-13 21:24:23 -0700 + Commit: 92cebad, github.com/apache/spark/pull/721 + + [SQL] Make it possible to create Java/Python SQLContexts from an existing Scala SQLContext. + Michael Armbrust + 2014-05-13 21:23:51 -0700 + Commit: 4423386, github.com/apache/spark/pull/761 + + [SPARK-1527] change rootDir*.getName to rootDir*.getAbsolutePath + Ye Xianjin + 2014-05-13 19:03:51 -0700 + Commit: 753b04d, github.com/apache/spark/pull/436 + + [SPARK-1816] LiveListenerBus dies if a listener throws an exception + Andrew Or + 2014-05-13 18:32:32 -0700 + Commit: 5c0dafc, github.com/apache/spark/pull/759 + + SPARK-1791 - SVM implementation does not use threshold parameter + Andrew Tulloch + 2014-05-13 17:31:27 -0700 + Commit: d1e4874, github.com/apache/spark/pull/725 + + SPARK-571: forbid return statements in cleaned closures + William Benton + 2014-05-13 13:45:23 -0700 + Commit: 16ffadc, github.com/apache/spark/pull/717 + + BUILD: Add more content to make-distribution.sh. + Patrick Wendell + 2014-05-12 23:02:54 -0700 + Commit: 52d9052 + + SPARK-1815. SparkContext should not be marked DeveloperApi + Sandy Ryza + 2014-05-12 20:08:30 -0700 + Commit: 2792bd0, github.com/apache/spark/pull/753 + + [SPARK-1753 / 1773 / 1814] Update outdated docs for spark-submit, YARN, standalone etc. 
+ Andrew Or + 2014-05-12 19:44:14 -0700 + Commit: 2ffd1ea, github.com/apache/spark/pull/701 + + [SPARK-1780] Non-existent SPARK_DAEMON_OPTS is lurking around + Andrew Or + 2014-05-12 19:42:35 -0700 + Commit: ba96bb3, github.com/apache/spark/pull/751 + + SPARK-1757 Failing test for saving null primitives with .saveAsParquetFile() + Andrew Ash , Michael Armbrust + 2014-05-12 19:23:39 -0700 + Commit: 156df87, github.com/apache/spark/pull/690 + + Modify a typo in monitoring.md + Kousuke Saruta + 2014-05-12 19:21:06 -0700 + Commit: 9cf9f18, github.com/apache/spark/pull/698 + + L-BFGS Documentation + DB Tsai + 2014-05-12 19:20:24 -0700 + Commit: 5c2275d, github.com/apache/spark/pull/702 + + Typo: resond -> respond + Andrew Ash + 2014-05-12 18:46:28 -0700 + Commit: a5150d1, github.com/apache/spark/pull/743 + + [SQL] Make Hive Metastore conversion functions publicly visible. + Michael Armbrust + 2014-05-12 18:40:30 -0700 + Commit: 2f1a337, github.com/apache/spark/pull/750 + + Adding hadoop-2.2 profile to the build + Patrick Wendell + 2014-05-12 15:40:48 -0700 + Commit: 3e13b8c + + [SPARK-1736] Spark submit for Windows + Andrew Or + 2014-05-12 17:39:40 -0700 + Commit: beb9cba, github.com/apache/spark/pull/745 + + SPARK-1802. (Addendium) Audit dependency graph when Spark is built with -Pyarn + Sean Owen + 2014-05-12 17:35:29 -0700 + Commit: 4b31f4e, github.com/apache/spark/pull/746 + + SPARK-1623: Use File objects instead of String's in HTTPBroadcast + Patrick Wendell + 2014-05-12 17:27:28 -0700 + Commit: 925d8b2, github.com/apache/spark/pull/749 + + Rename testExecutorEnvs --> executorEnvs. + Patrick Wendell + 2014-05-12 17:09:13 -0700 + Commit: 3ce526b, github.com/apache/spark/pull/747 + + SPARK-1802. Audit dependency graph when Spark is built with -Phive + Sean Owen + 2014-05-12 14:17:25 -0700 + Commit: 8586bf5, github.com/apache/spark/pull/744 + + SPARK-1798. 
Tests should clean up temp files + Sean Owen + 2014-05-12 14:16:19 -0700 + Commit: 7120a29, github.com/apache/spark/pull/732 + + BUILD: Include Hive with default packages when creating a release + Patrick Wendell + 2014-05-12 13:20:23 -0700 + Commit: 1e4a65e + + SPARK-1786: Reopening PR 724 + Ankur Dave , Joseph E. Gonzalez + 2014-05-12 13:05:24 -0700 + Commit: 0e2bde2, github.com/apache/spark/pull/742 + + SPARK-1806: Upgrade Mesos dependency to 0.18.1 + Bernardo Gomez Palacio + 2014-05-12 11:10:28 -0700 + Commit: d9c97ba, github.com/apache/spark/pull/741 + + SPARK-1772 Stop catching Throwable, let Executors die + Aaron Davidson + 2014-05-12 11:08:52 -0700 + Commit: 3af1f38, github.com/apache/spark/pull/715 + + Revert "SPARK-1786: Edge Partition Serialization" + Patrick Wendell + 2014-05-12 10:49:03 -0700 + Commit: af15c82 + + SPARK-1786: Edge Partition Serialization + Ankur Dave , Joseph E. Gonzalez + 2014-05-11 19:20:42 -0700 + Commit: a6b02fb, github.com/apache/spark/pull/724 + + Fix error in 2d Graph Partitioner + Joseph E. Gonzalez + 2014-05-11 18:33:46 -0700 + Commit: f938a15, github.com/apache/spark/pull/709 + + SPARK-1652: Set driver memory correctly in spark-submit. + Patrick Wendell + 2014-05-11 18:17:34 -0700 + Commit: 05c9aa9, github.com/apache/spark/pull/730 + + SPARK-1770: Load balance elements when repartitioning. + Patrick Wendell + 2014-05-11 17:11:55 -0700 + Commit: 7d9cc92, github.com/apache/spark/pull/727 + + remove outdated runtime Information scala home + witgo + 2014-05-11 14:34:27 -0700 + Commit: 6bee01d, github.com/apache/spark/pull/728 + + Enabled incremental build that comes with sbt 0.13.2 + Prashant Sharma + 2014-05-10 21:08:04 -0700 + Commit: 70bcdef, github.com/apache/spark/pull/525 + + [SPARK-1774] Respect SparkSubmit --jars on YARN (client) + Andrew Or + 2014-05-10 20:58:02 -0700 + Commit: 83e0424, github.com/apache/spark/pull/710 + + SPARK-1789. 
Multiple versions of Netty dependencies cause FlumeStreamSuite failure + Sean Owen + 2014-05-10 20:50:40 -0700 + Commit: 2b7bd29, github.com/apache/spark/pull/723 + + Unify GraphImpl RDDs + other graph load optimizations + Ankur Dave + 2014-05-10 14:48:07 -0700 + Commit: 905173d, github.com/apache/spark/pull/497 + + [SPARK-1690] Tolerating empty elements when saving Python RDD to text files + Kan Zhang + 2014-05-10 14:01:08 -0700 + Commit: 6c2691d, github.com/apache/spark/pull/644 + + Add Python includes to path before depickling broadcast values + Bouke van der Bijl + 2014-05-10 13:02:13 -0700 + Commit: 3776f2f, github.com/apache/spark/pull/656 + + fix broken in link in python docs + Andy Konwinski + 2014-05-10 12:46:51 -0700 + Commit: c05d11b, github.com/apache/spark/pull/650 + + SPARK-1708. Add a ClassTag on Serializer and things that depend on it + Matei Zaharia + 2014-05-10 12:10:24 -0700 + Commit: 7eefc9d, github.com/apache/spark/pull/700 + + [SPARK-1778] [SQL] Add 'limit' transformation to SchemaRDD. + Takuya UESHIN + 2014-05-10 12:03:27 -0700 + Commit: 8e94d27, github.com/apache/spark/pull/711 + + [SQL] Upgrade parquet library. + Michael Armbrust + 2014-05-10 11:48:01 -0700 + Commit: 4d60553, github.com/apache/spark/pull/684 + + [SPARK-1644] The org.datanucleus:* should not be packaged into spark-assembly-*.jar + witgo + 2014-05-10 10:15:04 -0700 + Commit: 5615108, github.com/apache/spark/pull/688 + + SPARK-1686: keep schedule() calling in the main thread + CodingCat + 2014-05-09 21:50:23 -0700 + Commit: 2f452cb, github.com/apache/spark/pull/639 + + SPARK-1770: Revert accidental(?) 
fix + Aaron Davidson + 2014-05-09 14:51:34 -0700 + Commit: 59577df, github.com/apache/spark/pull/716 + + [SPARK-1760]: fix building spark with maven documentation + witgo + 2014-05-09 01:51:26 -0700 + Commit: bd67551, github.com/apache/spark/pull/712 + + Converted bang to ask to avoid scary warning when a block is removed + Tathagata Das + 2014-05-08 22:34:08 -0700 + Commit: 32868f3, github.com/apache/spark/pull/708 + + MINOR: Removing dead code. + Patrick Wendell + 2014-05-08 22:33:06 -0700 + Commit: 4c60fd1 + + SPARK-1775: Unneeded lock in ShuffleMapTask.deserializeInfo + Sandeep + 2014-05-08 22:30:17 -0700 + Commit: 7db47c4, github.com/apache/spark/pull/707 + + SPARK-1565 (Addendum): Replace `run-example` with `spark-submit`. + Patrick Wendell + 2014-05-08 22:26:17 -0700 + Commit: 06b15ba, github.com/apache/spark/pull/704 + + [SPARK-1631] Correctly set the Yarn app name when launching the AM. + Marcelo Vanzin + 2014-05-08 20:46:11 -0700 + Commit: 3f779d8, github.com/apache/spark/pull/539 + + [SPARK-1755] Respect SparkSubmit --name on YARN + Andrew Or + 2014-05-08 20:45:29 -0700 + Commit: 8b78412, github.com/apache/spark/pull/699 + + Include the sbin/spark-config.sh in spark-executor + Bouke van der Bijl + 2014-05-08 20:43:37 -0700 + Commit: 2fd2752, github.com/apache/spark/pull/651 + + Bug fix of sparse vector conversion + Funes , funes + 2014-05-08 17:54:10 -0700 + Commit: 191279c, github.com/apache/spark/pull/661 + + [SPARK-1157][MLlib] Bug fix: lossHistory should exclude rejection steps, and remove miniBatch + DB Tsai + 2014-05-08 17:53:22 -0700 + Commit: 910a13b, github.com/apache/spark/pull/582 + + MLlib documentation fix + DB Tsai + 2014-05-08 17:52:32 -0700 + Commit: d38febe, github.com/apache/spark/pull/703 + + [SPARK-1754] [SQL] Add missing arithmetic DSL operations. 
+ Takuya UESHIN + 2014-05-08 15:31:47 -0700 + Commit: 322b180, github.com/apache/spark/pull/689 + + Fixing typo in als.py + Evan Sparks + 2014-05-08 13:07:30 -0700 + Commit: 5c5e7d5, github.com/apache/spark/pull/696 + + [SPARK-1745] Move interrupted flag from TaskContext constructor (minor) + Andrew Or + 2014-05-08 12:13:07 -0700 + Commit: c3f8b78, github.com/apache/spark/pull/675 + + SPARK-1565, update examples to be used with spark-submit script. + Prashant Sharma + 2014-05-08 10:23:05 -0700 + Commit: 44dd57f, github.com/apache/spark/pull/552 + + [SQL] Improve SparkSQL Aggregates + Michael Armbrust + 2014-05-08 01:08:43 -0400 + Commit: 19c8fb0, github.com/apache/spark/pull/683 + + Use numpy directly for matrix multiply. + Evan Sparks + 2014-05-08 00:24:36 -0400 + Commit: 6ed7e2c, github.com/apache/spark/pull/687 + + SPARK-1668: Add implicit preference as an option to examples/MovieLensALS + Sandeep + 2014-05-08 00:15:05 -0400 + Commit: 108c4c1, github.com/apache/spark/pull/597 + + SPARK-1544 Add support for deep decision trees. 
+ Manish Amde , manishamde , Evan Sparks + 2014-05-07 17:08:38 -0700 + Commit: f269b01, github.com/apache/spark/pull/475 + + Update GradientDescentSuite.scala + baishuo(白硕) + 2014-05-07 16:02:55 -0700 + Commit: 0c19bb1, github.com/apache/spark/pull/588 + + [SPARK-1743][MLLIB] add loadLibSVMFile and saveAsLibSVMFile to pyspark + Xiangrui Meng + 2014-05-07 16:01:11 -0700 + Commit: 3188553, github.com/apache/spark/pull/672 + + SPARK-1569 Spark on Yarn, authentication broken by pr299 + Thomas Graves + 2014-05-07 15:51:53 -0700 + Commit: 4bec84b, github.com/apache/spark/pull/649 + + [SPARK-1688] Propagate PySpark worker stderr to driver + Andrew Or + 2014-05-07 14:35:22 -0700 + Commit: 5200872, github.com/apache/spark/pull/603 + + Typo fix: fetchting -> fetching + Andrew Ash + 2014-05-07 17:24:49 -0400 + Commit: d00981a, github.com/apache/spark/pull/680 + + Nicer logging for SecurityManager startup + Andrew Ash + 2014-05-07 17:24:12 -0400 + Commit: 7f6f4a1, github.com/apache/spark/pull/678 + + [SQL] Fix Performance Issue in data type casting + Cheng Hao + 2014-05-07 16:54:58 -0400 + Commit: ca43186, github.com/apache/spark/pull/679 + + SPARK-1579: Clean up PythonRDD and avoid swallowing IOExceptions + Aaron Davidson + 2014-05-07 09:48:31 -0700 + Commit: 3308722, github.com/apache/spark/pull/640 + + [SPARK-1460] Returning SchemaRDD instead of normal RDD on Set operations... + Kan Zhang + 2014-05-07 09:41:31 -0700 + Commit: 967635a, github.com/apache/spark/pull/448 + + [WIP][Spark-SQL] Optimize the Constant Folding for Expression + Cheng Hao , Michael Armbrust + 2014-05-07 03:37:12 -0400 + Commit: 3eb53bd, github.com/apache/spark/pull/482 + + SPARK-1746: Support setting SPARK_JAVA_OPTS on executors for backwards compatibility + Patrick Wendell + 2014-05-07 00:11:05 -0700 + Commit: 913a0a9, github.com/apache/spark/pull/676 + + [HOTFIX] SPARK-1637: There are some Streaming examples added after the PR #571 was last updated. 
+ Sandeep + 2014-05-06 21:55:05 -0700 + Commit: fdae095, github.com/apache/spark/pull/673 + + Proposal: clarify Scala programming guide on caching ... + Ethan Jewett + 2014-05-06 20:50:08 -0700 + Commit: 48ba3b8, github.com/apache/spark/pull/668 + + SPARK-1727. Correct small compile errors, typos, and markdown issues in (primarly) MLlib docs + Sean Owen + 2014-05-06 20:07:22 -0700 + Commit: 25ad8f9, github.com/apache/spark/pull/653 + + SPARK-1637: Clean up examples for 1.0 + Sandeep + 2014-05-06 17:27:52 -0700 + Commit: a000b5c, github.com/apache/spark/pull/571 + + SPARK-1737: Warn rather than fail when Java 7+ is used to create distributions + Patrick Wendell + 2014-05-06 15:41:46 -0700 + Commit: 39b8b14, github.com/apache/spark/pull/669 + + [SPARK-1549] Add Python support to spark-submit + Matei Zaharia + 2014-05-06 15:12:35 -0700 + Commit: 951a5d9, github.com/apache/spark/pull/664 + + SPARK-1734: spark-submit throws an exception: Exception in thread "main"... + witgo + 2014-05-06 14:17:39 -0700 + Commit: ec09acd, github.com/apache/spark/pull/665 + + [SPARK-1685] Cancel retryTimer on restart of Worker or AppClient + Mark Hamstra + 2014-05-06 12:53:39 -0700 + Commit: fbfe69d, github.com/apache/spark/pull/602 + + Fix two download suggestions in the docs: + Patrick Wendell + 2014-05-06 12:07:46 -0700 + Commit: 7b978c1, github.com/apache/spark/pull/662 + + SPARK-1474: Spark on yarn assembly doesn't include AmIpFilter + Thomas Graves + 2014-05-06 12:00:09 -0700 + Commit: 1e82990, github.com/apache/spark/pull/406 + + Update OpenHashSet.scala + ArcherShao + 2014-05-06 10:12:59 -0700 + Commit: 0a5a468, github.com/apache/spark/pull/667 + + [SQL] SPARK-1732 - Support for null primitive values. 
+ Michael Armbrust + 2014-05-05 22:59:42 -0700 + Commit: 3c64750, github.com/apache/spark/pull/658 + + [SPARK-1735] Add the missing special profiles to make-distribution.sh + Andrew Or + 2014-05-05 22:14:47 -0700 + Commit: a2262cd, github.com/apache/spark/pull/660 + + [SPARK-1678][SPARK-1679] In-memory compression bug fix and made compression configurable, disabled by default + Cheng Lian + 2014-05-05 19:38:59 -0700 + Commit: 6d721c5, github.com/apache/spark/pull/608 + + [SPARK-1594][MLLIB] Cleaning up MLlib APIs and guide + Xiangrui Meng + 2014-05-05 18:32:54 -0700 + Commit: 98750a7, github.com/apache/spark/pull/524 + + Expose SparkListeners and relevant classes as DeveloperApi + Andrew Or + 2014-05-05 18:32:14 -0700 + Commit: ea10b31, github.com/apache/spark/pull/648 + + SPARK-1728. JavaRDDLike.mapPartitionsWithIndex requires ClassTag + Sandy Ryza + 2014-05-05 18:26:34 -0700 + Commit: 8e724dc, github.com/apache/spark/pull/657 + + [SPARK-1681] Include datanucleus jars in Spark Hive distribution + Andrew Or + 2014-05-05 16:28:07 -0700 + Commit: cf0a8f0, github.com/apache/spark/pull/610 + + [SPARK-1504], [SPARK-1505], [SPARK-1558] Updated Spark Streaming guide + Tathagata Das + 2014-05-05 15:28:19 -0700 + Commit: a975a19, github.com/apache/spark/pull/652 + + SPARK-1721: Reset the thread classLoader in the Mesos Executor + Bouke van der Bijl + 2014-05-05 11:19:35 -0700 + Commit: 3292e2a, github.com/apache/spark/pull/620 + + SPARK-1556. jets3t dep doesn't update properly with newer Hadoop versions + Sean Owen + 2014-05-05 10:33:49 -0700 + Commit: 73b0cbc, github.com/apache/spark/pull/629 + + Updated doc for spark.closure.serializer to indicate only Java serializer work. 
+ Reynold Xin + 2014-05-05 00:52:06 -0700 + Commit: f2eb070, github.com/apache/spark/pull/642 + + Address SPARK-1717 + msiddalingaiah + 2014-05-04 21:59:10 -0700 + Commit: bb2bb0c, github.com/apache/spark/pull/641 + + SPARK-1710: spark-submit should print better errors than "InvocationTargetException" + Sandeep + 2014-05-04 20:51:53 -0700 + Commit: b48a55a, github.com/apache/spark/pull/630 + + EC2 script should exit with non-zero code on UsageError + Allan Douglas R. de Oliveira + 2014-05-04 20:36:51 -0700 + Commit: bcb9b7f, github.com/apache/spark/pull/638 + + SPARK-1693: Most of the tests throw a java.lang.SecurityException when s... + witgo + 2014-05-04 17:48:52 -0700 + Commit: d940e4c, github.com/apache/spark/pull/628 + + SPARK-1629. Addendum: Depend on commons lang3 (already used by tachyon) as it's used in ReplSuite, and return to use lang3 utility in Utils.scala + Sean Owen + 2014-05-04 17:43:28 -0700 + Commit: f504157, github.com/apache/spark/pull/635 + + SPARK-1703 Warn users if Spark is run on JRE6 but compiled with JDK7. + Patrick Wendell + 2014-05-04 12:22:23 -0700 + Commit: 0c98a8f, github.com/apache/spark/pull/627 + + SPARK-1663. (Addendum) Fix signature of one version of JavaPairRDDStream.reduceByKeyAndWindow() + Sean Owen + 2014-05-04 11:55:29 -0700 + Commit: 0088ced, github.com/apache/spark/pull/633 + + SPARK-1658: Correctly identify if maven is installed and working + Rahul Singhal + 2014-05-04 11:08:39 -0700 + Commit: e97a2e6, github.com/apache/spark/pull/580 + + The default version of yarn is equal to the hadoop version + witgo + 2014-05-03 23:32:12 -0700 + Commit: fb05432, github.com/apache/spark/pull/626 + + Whitelist Hive Tests + Michael Armbrust + 2014-05-03 23:13:51 -0700 + Commit: 92b2902, github.com/apache/spark/pull/596 + + [SQL] Better logging when applying rules. + Michael Armbrust + 2014-05-03 18:38:44 -0700 + Commit: b295714, github.com/apache/spark/pull/616 + + EC2 configurable workers + Allan Douglas R. 
de Oliveira + 2014-05-03 16:52:19 -0700 + Commit: 4669a84, github.com/apache/spark/pull/612 + + SPARK-1689 AppClient should indicate app is dead() when removed + Aaron Davidson + 2014-05-03 13:27:10 -0700 + Commit: 34719ba, github.com/apache/spark/pull/605 + + [Bugfix] Tachyon file cleanup logical error + Cheng Lian + 2014-05-03 13:23:52 -0700 + Commit: ce72c72, github.com/apache/spark/pull/575 + + SPARK-1663. Corrections for several compile errors in streaming code examples, and updates to follow API changes + Sean Owen + 2014-05-03 12:31:31 -0700 + Commit: 11d5494, github.com/apache/spark/pull/589 + + [WIP] SPARK-1676: Cache Hadoop UGIs by default to prevent FileSystem leak + Thomas Graves + 2014-05-03 10:59:05 -0700 + Commit: 3d0a02d, github.com/apache/spark/pull/621 + + Update SchemaRDD.scala + ArcherShao + 2014-05-03 00:17:36 -0700 + Commit: 9347565, github.com/apache/spark/pull/619 + + SPARK-1700: Close socket file descriptors on task completion + Aaron Davidson + 2014-05-02 23:55:13 -0700 + Commit: 0a14421, github.com/apache/spark/pull/623 + + SPARK-1492. Update Spark YARN docs to use spark-submit + Sandy Ryza + 2014-05-02 21:42:31 -0700 + Commit: 2b961d8, github.com/apache/spark/pull/601 + + delete no use var + wangfei + 2014-05-02 21:34:54 -0700 + Commit: 4bf24f7, github.com/apache/spark/pull/613 + + SPARK-1695: java8-tests compiler error: package com.google.common.co... 
+ witgo + 2014-05-02 12:40:27 -0700 + Commit: f25ebed, github.com/apache/spark/pull/611 + + Add tests for FileLogger, EventLoggingListener, and ReplayListenerBus + Andrew Or + 2014-05-01 21:42:06 -0700 + Commit: 394d8cb, github.com/apache/spark/pull/591 + + SPARK-1659: improvements spark-submit usage + witgo + 2014-05-01 21:39:40 -0700 + Commit: 40cf6d3, github.com/apache/spark/pull/581 + + fix the spelling mistake + wangfei + 2014-05-01 21:37:22 -0700 + Commit: 55c760f, github.com/apache/spark/pull/614 + + [SQL] SPARK-1661 - Fix regex_serde test + Michael Armbrust + 2014-05-01 21:32:43 -0700 + Commit: a43d9c1, github.com/apache/spark/pull/595 + + SPARK-1691: Support quoted arguments inside of spark-submit. + Patrick Wendell + 2014-05-01 01:15:51 -0700 + Commit: 98b6559, github.com/apache/spark/pull/609 + + Fix SPARK-1629: Spark should inline use of commons-lang `SystemUtils.IS_... + witgo + 2014-04-30 09:49:45 -0700 + Commit: 55100da, github.com/apache/spark/pull/569 + + SPARK-1004. PySpark on YARN + Sandy Ryza + 2014-04-29 23:24:34 -0700 + Commit: ff5be9a, github.com/apache/spark/pull/30 + + Handle the vals that never used + WangTao + 2014-04-29 22:07:20 -0700 + Commit: 7025dda, github.com/apache/spark/pull/565 + + Args for worker rather than master + Chen Chao + 2014-04-29 22:05:40 -0700 + Commit: b3d2ab6, github.com/apache/spark/pull/587 + + [SPARK-1646] Micro-optimisation of ALS + Tor Myklebust + 2014-04-29 22:04:34 -0700 + Commit: 5c0cd5c, github.com/apache/spark/pull/568 + + [SPARK-1674] fix interrupted system call error in pyspark's RDD.pipe + Xiangrui Meng + 2014-04-29 18:06:45 -0700 + Commit: d33df1c, github.com/apache/spark/pull/594 + + SPARK-1588. Restore SPARK_YARN_USER_ENV and SPARK_JAVA_OPTS for YARN. 
+ Sandy Ryza + 2014-04-29 12:54:02 -0700 + Commit: bf8d0aa, github.com/apache/spark/pull/586 + + SPARK-1509: add zipWithIndex zipWithUniqueId methods to java api + witgo + 2014-04-29 11:30:47 -0700 + Commit: 7d15058, github.com/apache/spark/pull/423 + + SPARK-1557 Set permissions on event log files/directories + Thomas Graves + 2014-04-29 09:19:48 -0500 + Commit: 8db0f7e, github.com/apache/spark/pull/538 + + HOTFIX: minor change to release script + Patrick Wendell + 2014-04-29 00:59:38 -0700 + Commit: 9a1184a + + HOTFIX: minor change to release script + Patrick Wendell + 2014-04-29 00:53:32 -0700 + Commit: f04bcaf + + [SPARK-1636][MLLIB] Move main methods to examples + Xiangrui Meng + 2014-04-29 00:41:03 -0700 + Commit: 3f38334, github.com/apache/spark/pull/584 + + Minor fix to python table caching API. + Michael Armbrust + 2014-04-29 00:36:15 -0700 + Commit: 497be3c, github.com/apache/spark/pull/585 + + HOTFIX: Bug in release script + Patrick Wendell + 2014-04-29 00:10:17 -0700 + Commit: 719c8bc + + Improved build configuration + witgo + 2014-04-28 22:50:51 -0700 + Commit: 030f2c2, github.com/apache/spark/pull/480 + + SPARK-1652: Remove incorrect deprecation warning in spark-submit + Patrick Wendell + 2014-04-28 18:14:59 -0700 + Commit: 9f7a095, github.com/apache/spark/pull/578 + + SPARK-1654 and SPARK-1653: Fixes in spark-submit. 
+ Patrick Wendell + 2014-04-28 17:29:22 -0700 + Commit: 949e393, github.com/apache/spark/pull/576 + + SPARK-1652: Spark submit should fail gracefully if YARN not enabled + Patrick Wendell + 2014-04-28 17:26:57 -0700 + Commit: cae054a, github.com/apache/spark/pull/579 + + Changes to dev release script + Patrick Wendell + 2014-04-28 13:58:42 -0700 + Commit: 8421034 + + [SPARK-1633][Streaming] Java API unit test and example for custom streaming receiver in Java + Tathagata Das + 2014-04-28 13:58:09 -0700 + Commit: 1d84964, github.com/apache/spark/pull/558 + + [SQL]Append some missing types for HiveUDF + Cheng Hao + 2014-04-27 23:59:42 -0700 + Commit: f735884, github.com/apache/spark/pull/459 + + Update the import package name for TestHive in sbt shell + Cheng Hao + 2014-04-27 23:57:29 -0700 + Commit: ea01aff, github.com/apache/spark/pull/574 + + Fix SPARK-1609: Executor fails to start when Command.extraJavaOptions contains multiple Java options + witgo + 2014-04-27 19:41:02 -0700 + Commit: 71f4d26, github.com/apache/spark/pull/547 + + SPARK-1145: Memory mapping with many small blocks can cause JVM allocation failures + Patrick Wendell + 2014-04-27 17:40:56 -0700 + Commit: 6b3c6e5, github.com/apache/spark/pull/43 + + HOTFIX: Minor patch to merge script. + Patrick Wendell + 2014-04-27 15:45:17 -0700 + Commit: 3d9fb09 + + SPARK-1651: Delete existing deployment directory + Rahul Singhal + 2014-04-27 15:50:48 -0700 + Commit: eefb90d, github.com/apache/spark/pull/573 + + SPARK-1648 Support closing JIRA's as part of merge script. + Patrick Wendell + 2014-04-27 15:41:57 -0700 + Commit: fe65bee, github.com/apache/spark/pull/570 + + SPARK-1650: Correctly identify maven project version + Rahul Singhal + 2014-04-27 15:17:06 -0700 + Commit: 7b2527d, github.com/apache/spark/pull/572 + + SPARK-1606: Infer user application arguments instead of requiring --arg. 
+ Patrick Wendell + 2014-04-26 19:24:29 -0700 + Commit: aa9a7f5, github.com/apache/spark/pull/563 + + SPARK-1467: Make StorageLevel.apply() factory methods Developer APIs + Sandeep + 2014-04-26 19:04:33 -0700 + Commit: 762af4e, github.com/apache/spark/pull/551 + + [SPARK-1608] [SQL] Fix Cast.nullable when cast from StringType to NumericType/TimestampType. + Takuya UESHIN + 2014-04-26 14:39:54 -0700 + Commit: 8e37ed6, github.com/apache/spark/pull/532 + + add note of how to support table with more than 22 fields + wangfei + 2014-04-26 14:38:42 -0700 + Commit: e6e44e4, github.com/apache/spark/pull/564 + + [Spark-1382] Fix NPE in DStream.slice (updated version of #365) + zsxwing , Tathagata Das + 2014-04-25 19:04:34 -0700 + Commit: 058797c, github.com/apache/spark/pull/562 + + SPARK-1632. Remove unnecessary boxing in compares in ExternalAppendOnlyM... + Sandy Ryza + 2014-04-25 17:55:04 -0700 + Commit: 87cf35c, github.com/apache/spark/pull/559 + + SPARK-1235: manage the DAGScheduler EventProcessActor with supervisor and refactor the DAGScheduler with Akka + CodingCat , Xiangrui Meng , Nan Zhu + 2014-04-25 16:04:48 -0700 + Commit: 027f1b8, github.com/apache/spark/pull/186 + + SPARK-1607. HOTFIX: Fix syntax adapting Int result to Short + Sean Owen + 2014-04-25 14:17:38 -0700 + Commit: df6d814, github.com/apache/spark/pull/556 + + Update KafkaWordCount.scala + baishuo(白硕) + 2014-04-25 13:18:49 -0700 + Commit: 8aaef5c, github.com/apache/spark/pull/523 + + Delete the val that never used + WangTao + 2014-04-25 11:47:01 -0700 + Commit: 25a276d, github.com/apache/spark/pull/553 + + SPARK-1621 Upgrade Chill to 0.3.6 + Matei Zaharia + 2014-04-25 11:12:41 -0700 + Commit: a24d918, github.com/apache/spark/pull/543 + + SPARK-1619 Launch spark-shell with spark-submit + Patrick Wendell + 2014-04-24 23:59:16 -0700 + Commit: dc3b640, github.com/apache/spark/pull/542 + + SPARK-1607. 
Replace octal literals, removed in Scala 2.11, with hex literals + Sean Owen + 2014-04-24 23:34:00 -0700 + Commit: 6e101f1, github.com/apache/spark/pull/529 + + Call correct stop(). + Aaron Davidson + 2014-04-24 23:22:03 -0700 + Commit: 45ad7f0, github.com/apache/spark/pull/527 + + SPARK-1242 Add aggregate to python rdd + Holden Karau + 2014-04-24 23:07:54 -0700 + Commit: e03bc37, github.com/apache/spark/pull/139 + + Fix [SPARK-1078]: Remove the Unnecessary lift-json dependency + Sandeep + 2014-04-24 21:51:52 -0700 + Commit: 095b518, github.com/apache/spark/pull/536 + + [Typo] In the maven docs: chd -> cdh + Andrew Or + 2014-04-24 21:51:17 -0700 + Commit: 06e82d9, github.com/apache/spark/pull/548 + + Generalize pattern for planning hash joins. + Michael Armbrust + 2014-04-24 21:42:33 -0700 + Commit: 86ff8b1, github.com/apache/spark/pull/418 + + [SPARK-1617] and [SPARK-1618] Improvements to streaming ui and bug fix to socket receiver + Tathagata Das + 2014-04-24 21:34:37 -0700 + Commit: cd12dd9, github.com/apache/spark/pull/540 + + SPARK-1586 Windows build fixes + Mridul Muralidharan + 2014-04-24 20:48:33 -0700 + Commit: 968c018, github.com/apache/spark/pull/505 + + SPARK-1584: Upgrade Flume dependency to 1.4.0 + tmalaska + 2014-04-24 20:31:17 -0700 + Commit: d5c6ae6, github.com/apache/spark/pull/507 + + [SPARK-986]: Job cancelation for PySpark + Ahir Reddy + 2014-04-24 20:21:10 -0700 + Commit: e53eb4f, github.com/apache/spark/pull/541 + + [SPARK-1615] Synchronize accesses to the LiveListenerBus' event queue + Andrew Or + 2014-04-24 20:18:15 -0700 + Commit: ee6f7e2, github.com/apache/spark/pull/544 + + [SPARK-1510] Spark Streaming metrics source for metrics system + jerryshao , Tathagata Das + 2014-04-24 18:56:57 -0700 + Commit: 80429f3, github.com/apache/spark/pull/545 + + Spark 1489 Fix the HistoryServer view acls + Thomas Graves + 2014-04-24 18:38:10 -0700 + Commit: 44da5ab, github.com/apache/spark/pull/509 + + [SQL] Add support for parsing indexing into arrays 
in SQL. + Michael Armbrust + 2014-04-24 18:21:00 -0700 + Commit: 4660991, github.com/apache/spark/pull/518 + + [SPARK-1592][streaming] Automatically remove streaming input blocks + Tathagata Das + 2014-04-24 18:18:22 -0700 + Commit: 526a518, github.com/apache/spark/pull/512 + + SPARK-1438 RDD.sample() make seed param optional + Arun Ramakrishnan + 2014-04-24 17:27:16 -0700 + Commit: 35e3d19, github.com/apache/spark/pull/477 + + SPARK-1104: kill Process in workerThread of ExecutorRunner + CodingCat + 2014-04-24 15:55:18 -0700 + Commit: f99af85, github.com/apache/spark/pull/35 + + Fix Scala Style + Sandeep + 2014-04-24 15:07:23 -0700 + Commit: a03ac22, github.com/apache/spark/pull/531 + + SPARK-1494 Don't initialize classes loaded by MIMA excludes, attempt 2 + Michael Armbrust + 2014-04-24 14:54:01 -0700 + Commit: c5c1916, github.com/apache/spark/pull/526 + + Spark 1490 Add kerberos support to the HistoryServer + Thomas Graves + 2014-04-24 11:15:12 -0700 + Commit: bd37509, github.com/apache/spark/pull/513 + + SPARK-1611: Fix incorrect initialization order in AppendOnlyMap + zsxwing + 2014-04-24 11:13:40 -0700 + Commit: 78a49b2, github.com/apache/spark/pull/534 + + SPARK-1488. Squash more language feature warnings in new commits by importing implicitConversion + Sean Owen + 2014-04-24 10:06:18 -0700 + Commit: 6338a93, github.com/apache/spark/pull/528 + + Small changes to release script + Patrick Wendell + 2014-04-24 09:59:44 -0700 + Commit: faeb761 + + [SPARK-1610] [SQL] Fix Cast to use exact type value when cast from BooleanType to NumericTy... 
+ Takuya UESHIN + 2014-04-24 09:57:28 -0700 + Commit: 27b2821, github.com/apache/spark/pull/533 + + SPARK-1601 & SPARK-1602: two bug fixes related to cancellation + Reynold Xin + 2014-04-24 00:27:45 -0700 + Commit: 1fdf659, github.com/apache/spark/pull/521 + + SPARK-1587 Fix thread leak + Mridul Muralidharan + 2014-04-23 23:20:55 -0700 + Commit: dd681f5, github.com/apache/spark/pull/504 + + [Fix #79] Replace Breakable For Loops By While Loops + Sandeep + 2014-04-23 22:47:59 -0700 + Commit: bb68f47, github.com/apache/spark/pull/503 + + SPARK-1589: Fix the incorrect compare + zsxwing + 2014-04-23 22:36:02 -0700 + Commit: 6ab7578, github.com/apache/spark/pull/508 + + Mark all fields of EdgePartition, Graph, and GraphOps transient + Ankur Dave + 2014-04-23 22:01:13 -0700 + Commit: 1d6abe3, github.com/apache/spark/pull/520 + + Update Java api for setJobGroup with interruptOnCancel + Aaron Davidson + 2014-04-23 22:00:22 -0700 + Commit: d485eec, github.com/apache/spark/pull/522 + + [Hot Fix #469] Fix flaky test in SparkListenerSuite + Andrew Or + 2014-04-23 21:59:33 -0700 + Commit: 4b2bab1, github.com/apache/spark/pull/516 + + [SPARK-1540] Add an optional Ordering parameter to PairRDDFunctions. + Matei Zaharia + 2014-04-23 17:03:54 -0700 + Commit: 640f9a0, github.com/apache/spark/pull/487 + + SPARK-1582 Invoke Thread.interrupt() when cancelling jobs + Aaron Davidson + 2014-04-23 16:52:49 -0700 + Commit: 432201c, github.com/apache/spark/pull/498 + + Honor default fs name when initializing event logger. 
+ Marcelo Vanzin + 2014-04-23 14:47:38 -0700 + Commit: dd1b7a6, github.com/apache/spark/pull/450 + + SPARK-1572 Don't kill Executor if PythonRDD fails while computing parent + Aaron Davidson + 2014-04-23 14:46:30 -0700 + Commit: a967b00, github.com/apache/spark/pull/486 + + SPARK-1583: Fix a bug that using java.util.HashMap by mistake + zsxwing + 2014-04-23 14:12:20 -0700 + Commit: a664606, github.com/apache/spark/pull/500 + + SPARK-1119 and other build improvements + Patrick Wendell + 2014-04-23 10:19:32 -0700 + Commit: cd4ed29, github.com/apache/spark/pull/502 + + [SQL] SPARK-1571 Mistake in java example code + Michael Armbrust + 2014-04-22 22:19:32 -0700 + Commit: 39f85e0, github.com/apache/spark/pull/496 + + SPARK-1494 Don't initialize classes loaded by MIMA excludes. + Michael Armbrust + 2014-04-22 21:56:15 -0700 + Commit: 8e95081, github.com/apache/spark/pull/494 + + SPARK-1562 Fix visibility / annotation of Spark SQL APIs + Michael Armbrust + 2014-04-22 20:02:33 -0700 + Commit: aa77f8a, github.com/apache/spark/pull/489 + + [FIX: SPARK-1376] use --arg instead of --args in SparkSubmit to avoid warning messages + Xiangrui Meng + 2014-04-22 19:38:27 -0700 + Commit: 662c860, github.com/apache/spark/pull/485 + + [streaming][SPARK-1578] Removed requirement for TTL in StreamingContext. + Tathagata Das + 2014-04-22 19:35:13 -0700 + Commit: f3d19a9, github.com/apache/spark/pull/491 + + [Spark-1538] Fix SparkUI incorrectly hiding persisted RDDs + Andrew Or + 2014-04-22 19:24:03 -0700 + Commit: 2de5738, github.com/apache/spark/pull/469 + + Assorted clean-up for Spark-on-YARN. + Patrick Wendell + 2014-04-22 19:22:06 -0700 + Commit: 995fdc9, github.com/apache/spark/pull/488 + + [SPARK-1570] Fix classloading in JavaSQLContext.applySchema + Kan Zhang + 2014-04-22 15:05:12 -0700 + Commit: ea8cea8, github.com/apache/spark/pull/484 + + Fix compilation on Hadoop 2.4.x. 
+ Marcelo Vanzin + 2014-04-22 14:28:41 -0700 + Commit: 0ea0b1a, github.com/apache/spark/pull/483 + + [Fix #204] Eliminate delay between binding and log checking + Andrew Or + 2014-04-22 14:27:49 -0700 + Commit: 745e496, github.com/apache/spark/pull/441 + + [SPARK-1506][MLLIB] Documentation improvements for MLlib 1.0 + Xiangrui Meng + 2014-04-22 11:20:47 -0700 + Commit: 26d35f3, github.com/apache/spark/pull/422 + + [SPARK-1281] Improve partitioning in ALS + Tor Myklebust + 2014-04-22 11:07:30 -0700 + Commit: bf9d49b, github.com/apache/spark/pull/407 + + fix bugs of dot in python + Xusen Yin + 2014-04-22 11:06:18 -0700 + Commit: c919798, github.com/apache/spark/pull/463 + + [SPARK-1560]: Updated Pyrolite Dependency to be Java 6 compatible + Ahir Reddy + 2014-04-22 09:44:41 -0700 + Commit: 0f87e6a, github.com/apache/spark/pull/479 + + [HOTFIX] SPARK-1399: remove outdated comments + CodingCat + 2014-04-22 09:43:13 -0700 + Commit: 87de290, github.com/apache/spark/pull/474 + + SPARK-1496: Have jarOfClass return Option[String] + Patrick Wendell + 2014-04-22 00:42:16 -0700 + Commit: 83084d3, github.com/apache/spark/pull/438 + + [SPARK-1459] Use local path (and not complete URL) when opening local lo... 
+ Marcelo Vanzin + 2014-04-21 23:10:53 -0700 + Commit: ac164b7, github.com/apache/spark/pull/375 + + [Fix #274] Document + fix annotation usages + Andrew Or + 2014-04-21 22:24:44 -0700 + Commit: b3e5366, github.com/apache/spark/pull/470 + + [SPARK-1439, SPARK-1440] Generate unified Scaladoc across projects and Javadocs + Matei Zaharia + 2014-04-21 21:57:40 -0700 + Commit: fc78384, github.com/apache/spark/pull/457 + + [SPARK-1332] Improve Spark Streaming's Network Receiver and InputDStream API [WIP] + Tathagata Das + 2014-04-21 19:04:49 -0700 + Commit: 04c37b6, github.com/apache/spark/pull/300 + + Dev script: include RC name in git tag + Patrick Wendell + 2014-04-21 14:21:17 -0700 + Commit: 5a5b334 + + SPARK-1399: show stage failure reason in UI + CodingCat , Nan Zhu + 2014-04-21 14:10:23 -0700 + Commit: 43e4a29, github.com/apache/spark/pull/421 + + SPARK-1539: RDDPage.scala contains RddPage class + Xiangrui Meng + 2014-04-21 12:48:02 -0700 + Commit: b7df31e, github.com/apache/spark/pull/454 + + [Hot Fix] Ignore org.apache.spark.ui.UISuite tests + Andrew Or + 2014-04-21 12:37:43 -0700 + Commit: af46f1f, github.com/apache/spark/pull/466 + + Clean up and simplify Spark configuration + Patrick Wendell + 2014-04-21 10:26:33 -0700 + Commit: fb98488, github.com/apache/spark/pull/299 + + REPL cleanup. + Michael Armbrust + 2014-04-19 17:32:24 -0700 + Commit: 3a390bf, github.com/apache/spark/pull/451 + + [SPARK-1535] ALS: Avoid the garbage-creating ctor of DoubleMatrix + Tor Myklebust + 2014-04-19 15:10:18 -0700 + Commit: 25fc318, github.com/apache/spark/pull/442 + + Add insertInto and saveAsTable to Python API. + Michael Armbrust + 2014-04-19 15:08:54 -0700 + Commit: 10d0421, github.com/apache/spark/pull/447 + + Use scala deprecation instead of java. 
+ Michael Armbrust + 2014-04-19 15:06:04 -0700 + Commit: 5d0f58b, github.com/apache/spark/pull/452 + + README update + Reynold Xin + 2014-04-18 22:34:39 -0700 + Commit: 28238c8, github.com/apache/spark/pull/443 + + SPARK-1482: Fix potential resource leaks in saveAsHadoopDataset and save... + zsxwing + 2014-04-18 17:49:22 -0700 + Commit: 2089e0e, github.com/apache/spark/pull/400 + + SPARK-1456 Remove view bounds on Ordered in favor of a context bound on Ordering. + Michael Armbrust + 2014-04-18 12:04:13 -0700 + Commit: c399baa, github.com/apache/spark/pull/410 + + Fixed broken pyspark shell. + Reynold Xin + 2014-04-18 10:10:13 -0700 + Commit: 81a152c, github.com/apache/spark/pull/444 + + SPARK-1523: improve the readability of code in AkkaUtil + CodingCat + 2014-04-18 10:05:00 -0700 + Commit: 3c7a9ba, github.com/apache/spark/pull/434 + + SPARK-1357 (addendum). More Experimental items in MLlib + Sean Owen + 2014-04-18 10:04:02 -0700 + Commit: 8aa1f4c, github.com/apache/spark/pull/372 + + [SPARK-1520] remove fastutil from dependencies + Xiangrui Meng + 2014-04-18 10:03:15 -0700 + Commit: aa17f02, github.com/apache/spark/pull/437 + + Reuses Row object in ExistingRdd.productToRowRdd() + Cheng Lian + 2014-04-18 10:02:27 -0700 + Commit: 89f4743, github.com/apache/spark/pull/432 + + SPARK-1483: Rename minSplits to minPartitions in public APIs + CodingCat + 2014-04-18 10:01:16 -0700 + Commit: e31c8ff, github.com/apache/spark/pull/430 + + HOTFIX: Ignore streaming UI test + Patrick Wendell + 2014-04-17 17:33:24 -0700 + Commit: 7863ecc, github.com/apache/spark/pull/440 + + FIX: Don't build Hive in assembly unless running Hive tests. + Patrick Wendell + 2014-04-17 17:24:00 -0700 + Commit: 6c746ba, github.com/apache/spark/pull/439 + + SPARK-1408 Modify Spark on Yarn to point to the history server when app ... + Thomas Graves + 2014-04-17 16:36:37 -0500 + Commit: 0058b5d, github.com/apache/spark/pull/362 + + [SPARK-1395] Allow "local:" URIs to work on Yarn. 
+ Marcelo Vanzin + 2014-04-17 10:29:38 -0500 + Commit: 6904750, github.com/apache/spark/pull/303 + + [python alternative] pyspark require Python2, failing if system default is Py3 from shell.py + AbhishekKr + 2014-04-16 19:05:40 -0700 + Commit: bb76eae, github.com/apache/spark/pull/399 + + SPARK-1462: Examples of ML algorithms are using deprecated APIs + Sandeep + 2014-04-16 18:23:07 -0700 + Commit: 6ad4c54, github.com/apache/spark/pull/416 + + Include stack trace for exceptions thrown by user code. + Michael Armbrust + 2014-04-16 18:12:56 -0700 + Commit: d4916a8, github.com/apache/spark/pull/409 + + Update ReducedWindowedDStream.scala + baishuo(白硕) + 2014-04-16 18:08:11 -0700 + Commit: 07b7ad3, github.com/apache/spark/pull/425 + + misleading task number of groupByKey + Chen Chao + 2014-04-16 17:58:42 -0700 + Commit: 9c40b9e, github.com/apache/spark/pull/403 + + Fixing a race condition in event listener unit test + Kan Zhang + 2014-04-16 17:39:11 -0700 + Commit: 38877cc, github.com/apache/spark/pull/401 + + remove unnecessary brace and semicolon in 'putBlockInfo.synchronize' block + Chen Chao + 2014-04-16 17:30:01 -0700 + Commit: 016a877, github.com/apache/spark/pull/411 + + SPARK-1329: Create pid2vid with correct number of partitions + Ankur Dave + 2014-04-16 17:16:55 -0700 + Commit: 17d3234, github.com/apache/spark/pull/368 + + Rebuild routing table after Graph.reverse + Ankur Dave + 2014-04-16 17:15:50 -0700 + Commit: 235a47c, github.com/apache/spark/pull/431 + + Add clean to build + Patrick Wendell + 2014-04-16 16:32:34 -0700 + Commit: 987760e + + [SPARK-1511] use Files.move instead of renameTo in TestUtils.scala + Ye Xianjin + 2014-04-16 14:56:22 -0700 + Commit: 10b1c59, github.com/apache/spark/pull/427 + + SPARK-1465: Spark compilation is broken with the latest hadoop-2.4.0 release + xuan , xuan + 2014-04-16 14:41:22 -0500 + Commit: 725925c, github.com/apache/spark/pull/396 + + SPARK-1469: Scheduler mode should accept lower-case definitions and have... 
+ Sandeep + 2014-04-16 09:58:57 -0700 + Commit: e269c24, github.com/apache/spark/pull/388 + + Minor addition to SPARK-1497 + Patrick Wendell + 2014-04-16 09:43:17 -0700 + Commit: 82349fb + + SPARK-1497. Fix scalastyle warnings in YARN, Hive code + Sean Owen + 2014-04-16 09:34:59 -0700 + Commit: 77f8367, github.com/apache/spark/pull/413 + + SPARK-1310: Start adding k-fold cross validation to MLLib [adds kFold to MLUtils & fixes bug in BernoulliSampler] + Holden Karau + 2014-04-16 09:33:27 -0700 + Commit: c3527a3, github.com/apache/spark/pull/18 + + update spark.default.parallelism + Chen Chao + 2014-04-16 09:14:18 -0700 + Commit: 9edd887, github.com/apache/spark/pull/389 + + Loads test tables when running "sbt hive/console" without HIVE_DEV_HOME + Cheng Lian + 2014-04-16 08:54:34 -0700 + Commit: fec462c, github.com/apache/spark/pull/417 + + Make "spark logo" link refer to "/". + Marcelo Vanzin + 2014-04-16 08:53:01 -0700 + Commit: c0273d8, github.com/apache/spark/pull/408 + + [SPARK-959] Updated SBT from 0.13.1 to 0.13.2 + Cheng Lian + 2014-04-16 08:52:14 -0700 + Commit: 6a10d80, github.com/apache/spark/pull/426 + + [SQL] SPARK-1424 Generalize insertIntoTable functions on SchemaRDDs + Michael Armbrust + 2014-04-15 20:40:40 -0700 + Commit: 273c2fd, github.com/apache/spark/pull/354 + + [WIP] SPARK-1430: Support sparse data in Python MLlib + Matei Zaharia + 2014-04-15 20:33:24 -0700 + Commit: 63ca581, github.com/apache/spark/pull/341 + + [FIX] update sbt-idea to version 1.6.0 + Xiangrui Meng + 2014-04-15 19:37:32 -0700 + Commit: 8517911, github.com/apache/spark/pull/419 + + SPARK-1455: Better isolation for unit tests. + Patrick Wendell + 2014-04-15 19:34:39 -0700 + Commit: 5aaf983, github.com/apache/spark/pull/420 + + Decision Tree documentation for MLlib programming guide + Manish Amde + 2014-04-15 11:14:28 -0700 + Commit: 07d72fe, github.com/apache/spark/pull/402 + + [SPARK-1157][MLlib] L-BFGS Optimizer based on Breeze's implementation. 
+ DB Tsai + 2014-04-15 11:12:47 -0700 + Commit: 6843d63, github.com/apache/spark/pull/353 + + SPARK-1501: Ensure assertions in Graph.apply are asserted. + William Benton + 2014-04-15 10:38:42 -0700 + Commit: 2580a3b, github.com/apache/spark/pull/415 + + SPARK-1426: Make MLlib work with NumPy versions older than 1.7 + Sandeep + 2014-04-15 00:19:43 -0700 + Commit: df36091, github.com/apache/spark/pull/391 + + SPARK-1374: PySpark API for SparkSQL + Ahir Reddy , Michael Armbrust + 2014-04-15 00:07:55 -0700 + Commit: c99bcb7f, github.com/apache/spark/pull/363 + + SPARK-1488. Resolve scalac feature warnings during build + Sean Owen + 2014-04-14 19:50:00 -0700 + Commit: 0247b5c, github.com/apache/spark/pull/404 + + HOTFIX: Use file name and not paths for excludes + Patrick Wendell + 2014-04-14 15:51:54 -0700 + Commit: 268b535 + + [BUGFIX] In-memory columnar storage bug fixes + Cheng Lian , Michael Armbrust + 2014-04-14 15:22:43 -0700 + Commit: 7dbca68, github.com/apache/spark/pull/374 + + [SPARK-1415] Hadoop min split for wholeTextFiles() + Xusen Yin + 2014-04-13 13:18:52 -0700 + Commit: 037fe4d, github.com/apache/spark/pull/376 + + SPARK-1480: Clean up use of classloaders + Patrick Wendell + 2014-04-13 08:58:37 -0700 + Commit: 4bc07ee, github.com/apache/spark/pull/398 + + [SPARK-1403] Move the class loader creation back to where it was in 0.9.0 + Bharath Bhushan + 2014-04-12 20:52:29 -0700 + Commit: ca11919, github.com/apache/spark/pull/322 + + [Fix #204] Update out-dated comments + Andrew Or + 2014-04-12 16:33:38 -0700 + Commit: c2d160f, github.com/apache/spark/pull/381 + + [SPARK-1386] Web UI for Spark Streaming + Tathagata Das , Andrew Or + 2014-04-11 23:33:49 -0700 + Commit: 6aa08c3, github.com/apache/spark/pull/290 + + SPARK-1057 (alternative) Remove fastutil + Sean Owen + 2014-04-11 22:46:47 -0700 + Commit: 165e06a, github.com/apache/spark/pull/266 + + Update WindowedDStream.scala + baishuo(白硕) + 2014-04-11 20:33:42 -0700 + Commit: aa8bb11, 
github.com/apache/spark/pull/390 + + [WIP] [SPARK-1328] Add vector statistics + Xusen Yin , Xiangrui Meng + 2014-04-11 19:43:22 -0700 + Commit: fdfb45e, github.com/apache/spark/pull/268 + + [FIX] make coalesce test deterministic in RDDSuite + Xiangrui Meng + 2014-04-11 19:41:40 -0700 + Commit: 7038b00, github.com/apache/spark/pull/387 + + HOTFIX: Ignore python metastore files in RAT checks. + Patrick Wendell + 2014-04-11 13:23:21 -0700 + Commit: 6a0f8e3, github.com/apache/spark/pull/393 + + [SPARK-1225, 1241] [MLLIB] Add AreaUnderCurve and BinaryClassificationMetrics + Xiangrui Meng + 2014-04-11 12:06:13 -0700 + Commit: f5ace8d, github.com/apache/spark/pull/364 + + Some clean up in build/docs + Patrick Wendell + 2014-04-11 10:45:27 -0700 + Commit: 98225a6, github.com/apache/spark/pull/382 + + SPARK-1417: Spark on Yarn - spark UI link from resourcemanager is broken + Thomas Graves + 2014-04-11 13:17:48 +0530 + Commit: 446bb34, github.com/apache/spark/pull/344 + + SPARK-1202: Improvements to task killing in the UI. + Patrick Wendell + 2014-04-10 20:43:56 -0700 + Commit: 44f654e, github.com/apache/spark/pull/386 + + Add Spark v0.9.1 to ec2 launch script and use it as the default + Harvey Feng + 2014-04-10 18:25:54 -0700 + Commit: 7b4203a, github.com/apache/spark/pull/385 + + Set spark.executor.uri from environment variable (needed by Mesos) + Ivan Wick + 2014-04-10 17:49:30 -0700 + Commit: 5cd11d5, github.com/apache/spark/pull/311 + + SPARK-1202 - Add a "cancel" button in the UI for stages + Sundeep Narravula , Sundeep Narravula + 2014-04-10 17:10:11 -0700 + Commit: 2c55783, github.com/apache/spark/pull/246 + + [SQL] Improve column pruning in the optimizer. 
+ Michael Armbrust + 2014-04-10 16:20:33 -0700 + Commit: f99401a, github.com/apache/spark/pull/378 + + Remove Unnecessary Whitespace's + Sandeep + 2014-04-10 15:04:13 -0700 + Commit: 930b70f, github.com/apache/spark/pull/380 + + Update tuning.md + Andrew Ash + 2014-04-10 14:59:58 -0700 + Commit: f046662, github.com/apache/spark/pull/384 + + Revert "SPARK-1433: Upgrade Mesos dependency to 0.17.0" + Patrick Wendell + 2014-04-10 14:43:29 -0700 + Commit: 7b52b66 + + SPARK-1428: MLlib should convert non-float64 NumPy arrays to float64 instead of complaining + Sandeep + 2014-04-10 11:17:41 -0700 + Commit: 3bd3129, github.com/apache/spark/pull/356 + + [SPARK-1276] Add a HistoryServer to render persisted UI + Andrew Or + 2014-04-10 10:39:34 -0700 + Commit: 79820fe, github.com/apache/spark/pull/204 + + +Release 1.0.0 + + HOTFIX: Add no-arg SparkContext constructor in Java + Patrick Wendell + 2014-05-25 20:13:32 -0700 + Commit: 18c77cb, github.com/apache/spark/pull/878 + + [SQL] Minor: Introduce SchemaRDD#aggregate() for simple aggregations + Aaron Davidson + 2014-05-25 18:37:44 -0700 + Commit: a3976a2, github.com/apache/spark/pull/874 + + SPARK-1903 Document Spark's network connections + Andrew Ash + 2014-05-25 17:15:47 -0700 + Commit: 5107a6f, github.com/apache/spark/pull/856 + + Fix PEP8 violations in Python mllib. + Reynold Xin + 2014-05-25 17:15:01 -0700 + Commit: 07f34ca, github.com/apache/spark/pull/871 + + Python docstring update for sql.py. + Reynold Xin + 2014-05-25 16:04:17 -0700 + Commit: 8891495, github.com/apache/spark/pull/869 + + Fix PEP8 violations in examples/src/main/python. + Reynold Xin + 2014-05-25 14:48:27 -0700 + Commit: 3368397, github.com/apache/spark/pull/870 + + Added license header for tox.ini. + Reynold Xin + 2014-05-25 01:47:08 -0700 + Commit: 7273bfc + + SPARK-1822: Some minor cleanup work on SchemaRDD.count() + Reynold Xin + 2014-05-25 01:44:49 -0700 + Commit: aeffc20, github.com/apache/spark/pull/868 + + Added PEP8 style configuration file. 
+ Reynold Xin + 2014-05-25 01:32:15 -0700 + Commit: 291567d, github.com/apache/spark/pull/872 + + [SPARK-1822] SchemaRDD.count() should use query optimizer + Kan Zhang + 2014-05-25 00:06:42 -0700 + Commit: 64d0fb5, github.com/apache/spark/pull/841 + + spark-submit: add exec at the end of the script + Colin Patrick Mccabe + 2014-05-24 22:39:27 -0700 + Commit: 7e59335, github.com/apache/spark/pull/858 + + [SPARK-1886] check executor id existence when executor exit + Zhen Peng + 2014-05-24 20:40:19 -0700 + Commit: b5e9686, github.com/apache/spark/pull/827 + + Updated CHANGES.txt + Tathagata Das + 2014-05-25 02:20:13 +0000 + Commit: 8406092 + + SPARK-1911: Emphasize that Spark jars should be built with Java 6. + Patrick Wendell + 2014-05-24 18:27:00 -0700 + Commit: 217bd56, github.com/apache/spark/pull/859 + + [SPARK-1900 / 1918] PySpark on YARN is broken + Andrew Or + 2014-05-24 18:01:49 -0700 + Commit: 12f5ecc, github.com/apache/spark/pull/853 + + Update LBFGSSuite.scala + baishuo(白硕) + 2014-05-23 13:02:40 -0700 + Commit: 9be103a, github.com/apache/spark/pull/815 + + Updated scripts for auditing releases + Tathagata Das + 2014-05-22 20:48:55 -0700 + Commit: 6541ca2, github.com/apache/spark/pull/844 + + [SPARK-1896] Respect spark.master (and --master) before MASTER in spark-shell + Andrew Or + 2014-05-22 20:32:27 -0700 + Commit: c3b4065, github.com/apache/spark/pull/846 + + [SPARK-1897] Respect spark.jars (and --jars) in spark-shell + Andrew Or + 2014-05-22 20:25:41 -0700 + Commit: 23cc40e, github.com/apache/spark/pull/849 + + Fix UISuite unit test that fails under Jenkins contention + Aaron Davidson + 2014-05-22 15:11:05 -0700 + Commit: a566216, github.com/apache/spark/pull/857 + + [SPARK-1870] Make spark-submit --jars work in yarn-cluster mode. 
+ Xiangrui Meng + 2014-05-22 01:52:50 -0700 + Commit: 79cd26c, github.com/apache/spark/pull/848 + + Configuration documentation updates + Reynold Xin + 2014-05-21 18:49:12 -0700 + Commit: 75af8bd, github.com/apache/spark/pull/851 + + [SPARK-1889] [SQL] Apply splitConjunctivePredicates to join condition while finding join ke... + Takuya UESHIN + 2014-05-21 15:37:47 -0700 + Commit: 6e7934e, github.com/apache/spark/pull/836 + + [SPARK-1519] Support minPartitions param of wholeTextFiles() in PySpark + Kan Zhang + 2014-05-21 13:26:53 -0700 + Commit: 30d1df5, github.com/apache/spark/pull/697 + + [Typo] Stoped -> Stopped + Andrew Or + 2014-05-21 11:59:05 -0700 + Commit: 9b8f772, github.com/apache/spark/pull/847 + + [Minor] Move JdbcRDDSuite to the correct package + Andrew Or + 2014-05-21 01:25:10 -0700 + Commit: bc6bbfa, github.com/apache/spark/pull/839 + + [Docs] Correct example of creating a new SparkConf + Andrew Or + 2014-05-21 01:23:34 -0700 + Commit: 7295dd9, github.com/apache/spark/pull/842 + + [SPARK-1250] Fixed misleading comments in bin/pyspark, bin/spark-class + Sumedh Mungee + 2014-05-21 01:22:25 -0700 + Commit: 364c14a, github.com/apache/spark/pull/843 + + [Hotfix] Blacklisted flaky HiveCompatibility test + Tathagata Das + 2014-05-20 10:27:12 -0700 + Commit: b4d93d3, github.com/apache/spark/pull/838 + + Updated CHANGES.txt + Tathagata Das + 2014-05-19 23:12:24 -0700 + Commit: 1c00f2a + + [Spark 1877] ClassNotFoundException when loading RDD with serialized objects + Tathagata Das , Ghidireac + 2014-05-19 22:36:24 -0700 + Commit: 6cbe2a3, github.com/apache/spark/pull/835 + + [SPARK-1874][MLLIB] Clean up MLlib sample data + Xiangrui Meng + 2014-05-19 21:29:33 -0700 + Commit: 1c6c8b5, github.com/apache/spark/pull/833 + + SPARK-1689: Spark application should die when removed by Master + Aaron Davidson + 2014-05-19 20:55:26 -0700 + Commit: 78b6e6f, github.com/apache/spark/pull/832 + + [SPARK-1875]NoClassDefFoundError: StringUtils when building with hadoop 1.x and 
hive + witgo + 2014-05-19 19:40:29 -0700 + Commit: 875c54f, github.com/apache/spark/pull/824 + + SPARK-1879. Increase MaxPermSize since some of our builds have many classes + Matei Zaharia + 2014-05-19 18:42:28 -0700 + Commit: 00563e1, github.com/apache/spark/pull/823 + + SPARK-1878: Fix the incorrect initialization order + zsxwing + 2014-05-19 16:41:31 -0700 + Commit: 901102c, github.com/apache/spark/pull/822 + + [SPARK-1876] Windows fixes to deal with latest distribution layout changes + Matei Zaharia + 2014-05-19 15:02:35 -0700 + Commit: 111c121, github.com/apache/spark/pull/819 + + [WIP][SPARK-1871][MLLIB] Improve MLlib guide for v1.0 + Xiangrui Meng + 2014-05-18 17:00:57 -0700 + Commit: ecab8a2, github.com/apache/spark/pull/816 + + SPARK-1873: Add README.md file when making distributions + Patrick Wendell + 2014-05-18 16:51:53 -0700 + Commit: 8e8b351, github.com/apache/spark/pull/818 + + Fix spark-submit path in spark-shell & pyspark + Neville Li + 2014-05-18 13:31:23 -0700 + Commit: e06e4b0, github.com/apache/spark/pull/812 + + Make deprecation warning less severe + Patrick Wendell + 2014-05-16 22:58:47 -0700 + Commit: 3b3d7c8, github.com/apache/spark/pull/810 + + [SPARK-1824] Remove from Python examples + Andrew Or + 2014-05-16 22:36:23 -0700 + Commit: 03b4242, github.com/apache/spark/pull/802 + + [SPARK-1808] Route bin/pyspark through Spark submit + Andrew Or + 2014-05-16 22:34:38 -0700 + Commit: 318739a, github.com/apache/spark/pull/799 + + Version bump of spark-ec2 scripts + Patrick Wendell + 2014-05-16 21:42:14 -0700 + Commit: 9cd12f3, github.com/apache/spark/pull/809 + + SPARK-1864 Look in spark conf instead of system properties when propagating configuration to executors. 
+ Michael Armbrust + 2014-05-16 20:25:10 -0700 + Commit: a16a19f, github.com/apache/spark/pull/808 + + Tweaks to Mesos docs + Matei Zaharia + 2014-05-16 17:35:05 -0700 + Commit: 2ba6711, github.com/apache/spark/pull/806 + + [SQL] Implement between in hql + Michael Armbrust + 2014-05-16 11:47:00 -0700 + Commit: 386b31c, github.com/apache/spark/pull/804 + + bugfix: overflow of graphx Edge compare function + Zhen Peng + 2014-05-16 11:37:18 -0700 + Commit: ff47cdc, github.com/apache/spark/pull/769 + + SPARK-1862: Support for MapR in the Maven build. + Patrick Wendell + 2014-05-15 23:31:43 -0700 + Commit: eec4dd8, github.com/apache/spark/pull/803 + + [Spark-1461] Deferred Expression Evaluation (short-circuit evaluation) + Cheng Hao + 2014-05-15 22:12:34 -0700 + Commit: eac4ee8, github.com/apache/spark/pull/446 + + SPARK-1860: Do not cleanup application work/ directories by default + Aaron Davidson + 2014-05-15 21:37:58 -0700 + Commit: 5441471, github.com/apache/spark/pull/800 + + Typos in Spark + Huajian Mao + 2014-05-15 18:20:16 -0700 + Commit: a2742d8, github.com/apache/spark/pull/798 + + Fixes a misplaced comment. + Prashant Sharma + 2014-05-15 16:58:37 -0700 + Commit: 2e418f5, github.com/apache/spark/pull/788 + + [SQL] Fix tiny/small ints from HiveMetastore. + Michael Armbrust + 2014-05-15 16:50:42 -0700 + Commit: ffa9c49, github.com/apache/spark/pull/797 + + SPARK-1803 Replaced colon in filenames with a dash + Stevo Slavić , Stevo Slavic + 2014-05-15 16:44:14 -0700 + Commit: 22f261a, github.com/apache/spark/pull/739 + + SPARK-1851. Upgrade Avro dependency to 1.7.6 so Spark can read Avro file... + Sandy Ryza + 2014-05-15 16:35:39 -0700 + Commit: 3587057, github.com/apache/spark/pull/795 + + [SPARK-1741][MLLIB] add predict(JavaRDD) to RegressionModel, ClassificationModel, and KMeans + Xiangrui Meng + 2014-05-15 11:59:59 -0700 + Commit: bc9a96e, github.com/apache/spark/pull/670 + + [SPARK-1819] [SQL] Fix GetField.nullable. 
+ Takuya UESHIN + 2014-05-15 11:21:33 -0700 + Commit: f9eeddc, github.com/apache/spark/pull/757 + + [SPARK-1845] [SQL] Use AllScalaRegistrar for SparkSqlSerializer to register serializers of ... + Takuya UESHIN + 2014-05-15 11:20:21 -0700 + Commit: 7515367, github.com/apache/spark/pull/790 + + SPARK-1846 Ignore logs directory in RAT checks + Andrew Ash + 2014-05-15 11:05:39 -0700 + Commit: aa5f989, github.com/apache/spark/pull/793 + + HOTFIX: Don't build Javadoc in Maven when creating releases. + Patrick Wendell + 2014-05-14 23:48:03 -0700 + Commit: 88f1da3 + + fix different versions of commons-lang dependency and apache/spark#746 addendum + witgo + 2014-05-14 22:26:26 -0700 + Commit: 31b853c, github.com/apache/spark/pull/754 + + Package docs + Prashant Sharma , Patrick Wendell + 2014-05-14 22:24:41 -0700 + Commit: c02d614, github.com/apache/spark/pull/785 + + Documentation: Encourage use of reduceByKey instead of groupByKey. + Patrick Wendell + 2014-05-14 22:24:04 -0700 + Commit: f2faa37, github.com/apache/spark/pull/784 + + Add language tabs and Python version to interactive part of quick-start + Matei Zaharia + 2014-05-14 21:45:20 -0700 + Commit: 976784b, github.com/apache/spark/pull/782 + + [SPARK-1840] SparkListenerBus prints out scary error message when terminated normally + Tathagata Das + 2014-05-14 21:13:41 -0700 + Commit: ba87123, github.com/apache/spark/pull/783 + + default task number misleading in several places + Chen Chao + 2014-05-14 18:20:20 -0700 + Commit: 9f0f2ec, github.com/apache/spark/pull/766 + + [SPARK-1826] fix the head notation of package object dsl + wangfei + 2014-05-14 17:59:11 -0700 + Commit: fdf9717, github.com/apache/spark/pull/765 + + [Typo] propertes -> properties + andrewor14 + 2014-05-14 17:54:53 -0700 + Commit: 5ca3096, github.com/apache/spark/pull/780 + + [SPARK-1696][MLLIB] use alpha in dense dspr + Xiangrui Meng + 2014-05-14 17:18:30 -0700 + Commit: d6f1a75, github.com/apache/spark/pull/778 + + [FIX] do not load defaults when 
testing SparkConf in pyspark + Xiangrui Meng + 2014-05-14 14:57:17 -0700 + Commit: 31faec7, github.com/apache/spark/pull/775 + + SPARK-1833 - Have an empty SparkContext constructor. + Patrick Wendell + 2014-05-14 12:53:30 -0700 + Commit: 8e13ab2, github.com/apache/spark/pull/774 + + SPARK-1829 Sub-second durations shouldn't round to "0 s" + Andrew Ash + 2014-05-14 12:01:14 -0700 + Commit: 530bdf7, github.com/apache/spark/pull/768 + + Fix: sbt test throw an java.lang.OutOfMemoryError: PermGen space + witgo + 2014-05-14 11:19:26 -0700 + Commit: 379f733, github.com/apache/spark/pull/773 + + Adding back hive support + Patrick Wendell + 2014-05-14 10:21:27 -0700 + Commit: e8ca397 + + [SPARK-1620] Handle uncaught exceptions in function run by Akka scheduler + Mark Hamstra + 2014-05-14 10:07:25 -0700 + Commit: 9ff9078, github.com/apache/spark/pull/622 + + SPARK-1828: Created forked version of hive-exec that doesn't bundle other dependencies + Patrick Wendell + 2014-05-14 09:51:01 -0700 + Commit: 34f6fa9, github.com/apache/spark/pull/767 + + SPARK-1818 Freshen Mesos documentation + Andrew Ash + 2014-05-14 09:45:33 -0700 + Commit: fc6b652, github.com/apache/spark/pull/756 + + SPARK-1827. LICENSE and NOTICE files need a refresh to contain transitive dependency info + Sean Owen + 2014-05-14 09:38:33 -0700 + Commit: 7083282, github.com/apache/spark/pull/770 + + Fixed streaming examples docs to use run-example instead of spark-submit + Tathagata Das + 2014-05-14 04:17:32 -0700 + Commit: c7571d8, github.com/apache/spark/pull/722 + + [SPARK-1769] Executor loss causes NPE race condition + Andrew Or + 2014-05-14 00:54:33 -0700 + Commit: 69ec314, github.com/apache/spark/pull/762 + + Fix dep exclusion: avro-ipc, not avro, depends on netty. + Marcelo Vanzin + 2014-05-14 00:37:57 -0700 + Commit: b3d9878, github.com/apache/spark/pull/763 + + SPARK-1801. expose InterruptibleIterator and TaskKilledException in deve... 
+ Koert Kuipers + 2014-05-14 00:10:12 -0700 + Commit: 7da80a3, github.com/apache/spark/pull/764 + + [SQL] Improve column pruning. + Michael Armbrust + 2014-05-13 23:27:22 -0700 + Commit: f66f766, github.com/apache/spark/pull/729 + + Revert "[SPARK-1784] Add a new partitioner to allow specifying # of keys per partition" + Patrick Wendell + 2014-05-13 23:25:19 -0700 + Commit: 721194b + + Implement ApproximateCountDistinct for SparkSql + larvaboy + 2014-05-13 21:26:08 -0700 + Commit: 92b0ec9, github.com/apache/spark/pull/737 + + [SPARK-1784] Add a new partitioner to allow specifying # of keys per partition + Syed Hashmi + 2014-05-13 21:24:23 -0700 + Commit: 66fe479, github.com/apache/spark/pull/721 + + [SQL] Make it possible to create Java/Python SQLContexts from an existing Scala SQLContext. + Michael Armbrust + 2014-05-13 21:23:51 -0700 + Commit: 618b3e6, github.com/apache/spark/pull/761 + + [SPARK-1527] change rootDir*.getName to rootDir*.getAbsolutePath + Ye Xianjin + 2014-05-13 19:03:51 -0700 + Commit: ef5e9d7, github.com/apache/spark/pull/436 + + [SPARK-1816] LiveListenerBus dies if a listener throws an exception + Andrew Or + 2014-05-13 18:32:32 -0700 + Commit: 3892ec5, github.com/apache/spark/pull/759 + + SPARK-1791 - SVM implementation does not use threshold parameter + Andrew Tulloch + 2014-05-13 17:31:27 -0700 + Commit: d6994f4, github.com/apache/spark/pull/725 + + BUILD: Add more content to make-distribution.sh. + Patrick Wendell + 2014-05-12 23:02:54 -0700 + Commit: 716462c + + Adding CHANGES.txt file and removing YARN support for now + Patrick Wendell + 2014-05-12 20:21:23 -0700 + Commit: fa2d4d8 + + SPARK-1815. SparkContext should not be marked DeveloperApi + Sandy Ryza + 2014-05-12 20:08:30 -0700 + Commit: 31d54c0, github.com/apache/spark/pull/753 + + [SPARK-1753 / 1773 / 1814] Update outdated docs for spark-submit, YARN, standalone etc. 
+ Andrew Or + 2014-05-12 19:44:14 -0700 + Commit: b9e41f4, github.com/apache/spark/pull/701 + + [SPARK-1780] Non-existent SPARK_DAEMON_OPTS is lurking around + Andrew Or + 2014-05-12 19:42:35 -0700 + Commit: 5ef24a0, github.com/apache/spark/pull/751 + + SPARK-1757 Failing test for saving null primitives with .saveAsParquetFile() + Andrew Ash , Michael Armbrust + 2014-05-12 19:23:39 -0700 + Commit: b52ac0e, github.com/apache/spark/pull/690 + + Modify a typo in monitoring.md + Kousuke Saruta + 2014-05-12 19:21:06 -0700 + Commit: 89b56d7, github.com/apache/spark/pull/698 + + L-BFGS Documentation + DB Tsai + 2014-05-12 19:20:24 -0700 + Commit: bad4c9d, github.com/apache/spark/pull/702 + + Typo: resond -> respond + Andrew Ash + 2014-05-12 18:46:28 -0700 + Commit: 1fbebca, github.com/apache/spark/pull/743 + + [SQL] Make Hive Metastore conversion functions publicly visible. + Michael Armbrust + 2014-05-12 18:40:30 -0700 + Commit: 24cc933, github.com/apache/spark/pull/750 + + [SPARK-1736] Spark submit for Windows + Andrew Or + 2014-05-12 17:39:40 -0700 + Commit: 59695b3, github.com/apache/spark/pull/745 + + SPARK-1802. (Addendium) Audit dependency graph when Spark is built with -Pyarn + Sean Owen + 2014-05-12 17:35:29 -0700 + Commit: 02caa7e, github.com/apache/spark/pull/746 + + SPARK-1623: Use File objects instead of String's in HTTPBroadcast + Patrick Wendell + 2014-05-12 17:27:28 -0700 + Commit: c294f37, github.com/apache/spark/pull/749 + + Rename testExecutorEnvs --> executorEnvs. + Patrick Wendell + 2014-05-12 17:09:13 -0700 + Commit: e9d602d, github.com/apache/spark/pull/747 + + Adding hadoop-2.2 profile to the build + Patrick Wendell + 2014-05-12 15:40:48 -0700 + Commit: b66051e + + Rollback versions for 1.0.0-rc4 + Patrick Wendell + 2014-05-12 15:23:53 -0700 + Commit: 51142b7 + + SPARK-1802. Audit dependency graph when Spark is built with -Phive + Sean Owen + 2014-05-12 14:17:25 -0700 + Commit: e185281, github.com/apache/spark/pull/744 + + SPARK-1798. 
Tests should clean up temp files + Sean Owen + 2014-05-12 14:16:19 -0700 + Commit: 14515b4, github.com/apache/spark/pull/732 + + BUILD: Include Hive with default packages when creating a release + Patrick Wendell + 2014-05-12 13:20:23 -0700 + Commit: 722ecaa + + SPARK-1786: Reopening PR 724 + Ankur Dave , Joseph E. Gonzalez + 2014-05-12 13:05:24 -0700 + Commit: 642ad49, github.com/apache/spark/pull/742 + + SPARK-1806: Upgrade Mesos dependency to 0.18.1 + Bernardo Gomez Palacio + 2014-05-12 11:10:28 -0700 + Commit: 0be8b45, github.com/apache/spark/pull/741 + + SPARK-1772 Stop catching Throwable, let Executors die + Aaron Davidson + 2014-05-12 11:08:52 -0700 + Commit: c88adbb, github.com/apache/spark/pull/715 + + Revert "SPARK-1786: Edge Partition Serialization" + Patrick Wendell + 2014-05-12 10:51:01 -0700 + Commit: 19ccf20 + + SPARK-1786: Edge Partition Serialization + Ankur Dave , Joseph E. Gonzalez + 2014-05-11 19:20:42 -0700 + Commit: 09e7aa4, github.com/apache/spark/pull/724 + + Fix error in 2d Graph Partitioner + Joseph E. Gonzalez + 2014-05-11 18:33:46 -0700 + Commit: f84b798, github.com/apache/spark/pull/709 + + SPARK-1652: Set driver memory correctly in spark-submit. + Patrick Wendell + 2014-05-11 18:17:34 -0700 + Commit: 2eea663, github.com/apache/spark/pull/730 + + SPARK-1770: Load balance elements when repartitioning. 
+ Patrick Wendell + 2014-05-11 17:11:55 -0700 + Commit: 5d69699, github.com/apache/spark/pull/727 + + remove outdated runtime Information scala home + witgo + 2014-05-11 14:34:27 -0700 + Commit: 8097bb2, github.com/apache/spark/pull/728 + + Revert "Enabled incremental build that comes with sbt 0.13.2" + Patrick Wendell + 2014-05-10 21:08:53 -0700 + Commit: 758e543 + + Enabled incremental build that comes with sbt 0.13.2 + Prashant Sharma + 2014-05-10 21:08:04 -0700 + Commit: 71ce7eb, github.com/apache/spark/pull/525 + + [SPARK-1774] Respect SparkSubmit --jars on YARN (client) + Andrew Or + 2014-05-10 20:58:02 -0700 + Commit: 012f904, github.com/apache/spark/pull/710 + + SPARK-1789. Multiple versions of Netty dependencies cause FlumeStreamSuite failure + Sean Owen + 2014-05-10 20:50:40 -0700 + Commit: c7253da, github.com/apache/spark/pull/723 + + Unify GraphImpl RDDs + other graph load optimizations + Ankur Dave + 2014-05-10 14:48:07 -0700 + Commit: 4e9a0cb, github.com/apache/spark/pull/497 + + [SPARK-1690] Tolerating empty elements when saving Python RDD to text files + Kan Zhang + 2014-05-10 14:01:08 -0700 + Commit: ac86af8, github.com/apache/spark/pull/644 + + Add Python includes to path before depickling broadcast values + Bouke van der Bijl + 2014-05-10 13:02:13 -0700 + Commit: 2a669a7, github.com/apache/spark/pull/656 + + fix broken in link in python docs + Andy Konwinski + 2014-05-10 12:46:51 -0700 + Commit: 71ad53f, github.com/apache/spark/pull/650 + + SPARK-1708. Add a ClassTag on Serializer and things that depend on it + Matei Zaharia + 2014-05-10 12:10:24 -0700 + Commit: 9fbb22c, github.com/apache/spark/pull/700 + + [SPARK-1778] [SQL] Add 'limit' transformation to SchemaRDD. + Takuya UESHIN + 2014-05-10 12:03:27 -0700 + Commit: 7486474, github.com/apache/spark/pull/711 + + [SQL] Upgrade parquet library. 
+ Michael Armbrust + 2014-05-10 11:48:01 -0700 + Commit: a61b71c, github.com/apache/spark/pull/684 + + [SPARK-1644] The org.datanucleus:* should not be packaged into spark-assembly-*.jar + witgo + 2014-05-10 10:15:04 -0700 + Commit: 2a878da, github.com/apache/spark/pull/688 + + SPARK-1686: keep schedule() calling in the main thread + CodingCat + 2014-05-09 21:50:23 -0700 + Commit: adf8cdd, github.com/apache/spark/pull/639 + + SPARK-1770: Revert accidental(?) fix + Aaron Davidson + 2014-05-09 14:51:34 -0700 + Commit: 8202276, github.com/apache/spark/pull/716 + + [SPARK-1760]: fix building spark with maven documentation + witgo + 2014-05-09 01:51:26 -0700 + Commit: 80f292a, github.com/apache/spark/pull/712 + + Converted bang to ask to avoid scary warning when a block is removed + Tathagata Das + 2014-05-08 22:34:08 -0700 + Commit: b8c17e3, github.com/apache/spark/pull/708 + + MINOR: Removing dead code. + Patrick Wendell + 2014-05-08 22:33:06 -0700 + Commit: 1d56cd5 + + SPARK-1775: Unneeded lock in ShuffleMapTask.deserializeInfo + Sandeep + 2014-05-08 22:30:17 -0700 + Commit: 5c8e8de, github.com/apache/spark/pull/707 + + SPARK-1565 (Addendum): Replace `run-example` with `spark-submit`. + Patrick Wendell + 2014-05-08 22:26:17 -0700 + Commit: f6323eb, github.com/apache/spark/pull/704 + + [SPARK-1631] Correctly set the Yarn app name when launching the AM. 
+ Marcelo Vanzin + 2014-05-08 20:46:11 -0700 + Commit: 7e19334, github.com/apache/spark/pull/539 + + [SPARK-1755] Respect SparkSubmit --name on YARN + Andrew Or + 2014-05-08 20:45:29 -0700 + Commit: 666bebe, github.com/apache/spark/pull/699 + + Include the sbin/spark-config.sh in spark-executor + Bouke van der Bijl + 2014-05-08 20:43:37 -0700 + Commit: ab91227, github.com/apache/spark/pull/651 + + Bug fix of sparse vector conversion + Funes , funes + 2014-05-08 17:54:10 -0700 + Commit: 9ed17ff, github.com/apache/spark/pull/661 + + [SPARK-1157][MLlib] Bug fix: lossHistory should exclude rejection steps, and remove miniBatch + DB Tsai + 2014-05-08 17:53:22 -0700 + Commit: 3452997, github.com/apache/spark/pull/582 + + MLlib documentation fix + DB Tsai + 2014-05-08 17:52:32 -0700 + Commit: d81d626, github.com/apache/spark/pull/703 + + Fixing typo in als.py + Evan Sparks + 2014-05-08 13:07:30 -0700 + Commit: 98944a9, github.com/apache/spark/pull/696 + + [SPARK-1754] [SQL] Add missing arithmetic DSL operations. + Takuya UESHIN + 2014-05-08 15:31:47 -0700 + Commit: 6f701ff, github.com/apache/spark/pull/689 + + [SPARK-1745] Move interrupted flag from TaskContext constructor (minor) + Andrew Or + 2014-05-08 12:13:07 -0700 + Commit: ee63321, github.com/apache/spark/pull/675 + + SPARK-1565, update examples to be used with spark-submit script. + Prashant Sharma + 2014-05-08 10:23:05 -0700 + Commit: 30cfa8d, github.com/apache/spark/pull/552 + + [SQL] Improve SparkSQL Aggregates + Michael Armbrust + 2014-05-08 01:08:43 -0400 + Commit: 8f3b925, github.com/apache/spark/pull/683 + + Use numpy directly for matrix multiply. + Evan Sparks + 2014-05-08 00:24:36 -0400 + Commit: 010040f, github.com/apache/spark/pull/687 + + SPARK-1668: Add implicit preference as an option to examples/MovieLensALS + Sandeep + 2014-05-08 00:15:05 -0400 + Commit: 35aa244, github.com/apache/spark/pull/597 + + SPARK-1544 Add support for deep decision trees. 
+ Manish Amde , manishamde , Evan Sparks + 2014-05-07 17:08:38 -0700 + Commit: c7b2704, github.com/apache/spark/pull/475 + + Update GradientDescentSuite.scala + baishuo(白硕) + 2014-05-07 16:02:55 -0700 + Commit: 0972b62, github.com/apache/spark/pull/588 + + [SPARK-1743][MLLIB] add loadLibSVMFile and saveAsLibSVMFile to pyspark + Xiangrui Meng + 2014-05-07 16:01:11 -0700 + Commit: bb90e87, github.com/apache/spark/pull/672 + + SPARK-1569 Spark on Yarn, authentication broken by pr299 + Thomas Graves + 2014-05-07 15:51:53 -0700 + Commit: 879eeee, github.com/apache/spark/pull/649 + + [SPARK-1688] Propagate PySpark worker stderr to driver + Andrew Or + 2014-05-07 14:35:22 -0700 + Commit: 82c8e89, github.com/apache/spark/pull/603 + + Typo fix: fetchting -> fetching + Andrew Ash + 2014-05-07 17:24:49 -0400 + Commit: 0759ee7, github.com/apache/spark/pull/680 + + Nicer logging for SecurityManager startup + Andrew Ash + 2014-05-07 17:24:12 -0400 + Commit: 69e2726, github.com/apache/spark/pull/678 + + [SQL] Fix Performance Issue in data type casting + Cheng Hao + 2014-05-07 16:54:58 -0400 + Commit: 82ceda2, github.com/apache/spark/pull/679 + + SPARK-1579: Clean up PythonRDD and avoid swallowing IOExceptions + Aaron Davidson + 2014-05-07 09:48:31 -0700 + Commit: 18caa8c, github.com/apache/spark/pull/640 + + [SPARK-1460] Returning SchemaRDD instead of normal RDD on Set operations... + Kan Zhang + 2014-05-07 09:41:31 -0700 + Commit: da9f9e0, github.com/apache/spark/pull/448 + + [WIP][Spark-SQL] Optimize the Constant Folding for Expression + Cheng Hao , Michael Armbrust + 2014-05-07 03:37:12 -0400 + Commit: 756c969, github.com/apache/spark/pull/482 + + SPARK-1746: Support setting SPARK_JAVA_OPTS on executors for backwards compatibility + Patrick Wendell + 2014-05-07 00:11:05 -0700 + Commit: 00fac73, github.com/apache/spark/pull/676 + + [HOTFIX] SPARK-1637: There are some Streaming examples added after the PR #571 was last updated. 
+ Sandeep + 2014-05-06 21:55:05 -0700 + Commit: ade4756, github.com/apache/spark/pull/673 + + Proposal: clarify Scala programming guide on caching ... + Ethan Jewett + 2014-05-06 20:50:08 -0700 + Commit: 51e2775, github.com/apache/spark/pull/668 + + SPARK-1727. Correct small compile errors, typos, and markdown issues in (primarly) MLlib docs + Sean Owen + 2014-05-06 20:07:22 -0700 + Commit: 514ee93, github.com/apache/spark/pull/653 + + SPARK-1637: Clean up examples for 1.0 + Sandeep + 2014-05-06 17:27:52 -0700 + Commit: 8cfebf5, github.com/apache/spark/pull/571 + + SPARK-1737: Warn rather than fail when Java 7+ is used to create distributions + Patrick Wendell + 2014-05-06 15:41:46 -0700 + Commit: d8f1b33, github.com/apache/spark/pull/669 + + [SPARK-1549] Add Python support to spark-submit + Matei Zaharia + 2014-05-06 15:12:35 -0700 + Commit: d7ddb26, github.com/apache/spark/pull/664 + + SPARK-1734: spark-submit throws an exception: Exception in thread "main"... + witgo + 2014-05-06 14:17:39 -0700 + Commit: 48cc9a9, github.com/apache/spark/pull/665 + + [SPARK-1685] Cancel retryTimer on restart of Worker or AppClient + Mark Hamstra + 2014-05-06 12:53:39 -0700 + Commit: 0aaa2c6, github.com/apache/spark/pull/602 + + Fix two download suggestions in the docs: + Patrick Wendell + 2014-05-06 12:07:46 -0700 + Commit: 1083f2b, github.com/apache/spark/pull/662 + + SPARK-1474: Spark on yarn assembly doesn't include AmIpFilter + Thomas Graves + 2014-05-06 12:00:09 -0700 + Commit: 0c3e415, github.com/apache/spark/pull/406 + + Update OpenHashSet.scala + ArcherShao + 2014-05-06 10:12:59 -0700 + Commit: 4ff3929, github.com/apache/spark/pull/667 + + [SQL] SPARK-1732 - Support for null primitive values. 
+ Michael Armbrust + 2014-05-05 22:59:42 -0700 + Commit: 39ac62d, github.com/apache/spark/pull/658 + + [SPARK-1735] Add the missing special profiles to make-distribution.sh + Andrew Or + 2014-05-05 22:14:47 -0700 + Commit: 4708eff, github.com/apache/spark/pull/660 + + [SPARK-1678][SPARK-1679] In-memory compression bug fix and made compression configurable, disabled by default + Cheng Lian + 2014-05-05 19:38:59 -0700 + Commit: 2853e56, github.com/apache/spark/pull/608 + + [SPARK-1594][MLLIB] Cleaning up MLlib APIs and guide + Xiangrui Meng + 2014-05-05 18:32:54 -0700 + Commit: 32c960a, github.com/apache/spark/pull/524 + + Expose SparkListeners and relevant classes as DeveloperApi + Andrew Or + 2014-05-05 18:32:14 -0700 + Commit: a5f765c, github.com/apache/spark/pull/648 + + SPARK-1728. JavaRDDLike.mapPartitionsWithIndex requires ClassTag + Sandy Ryza + 2014-05-05 18:26:34 -0700 + Commit: 01e3ff0, github.com/apache/spark/pull/657 + + [SPARK-1681] Include datanucleus jars in Spark Hive distribution + Andrew Or + 2014-05-05 16:28:07 -0700 + Commit: 4d0dd50, github.com/apache/spark/pull/610 + + [SPARK-1504], [SPARK-1505], [SPARK-1558] Updated Spark Streaming guide + Tathagata Das + 2014-05-05 15:28:19 -0700 + Commit: 1fac4ec, github.com/apache/spark/pull/652 + + SPARK-1721: Reset the thread classLoader in the Mesos Executor + Bouke van der Bijl + 2014-05-05 11:19:35 -0700 + Commit: 80f4360, github.com/apache/spark/pull/620 + + SPARK-1556. jets3t dep doesn't update properly with newer Hadoop versions + Sean Owen + 2014-05-05 10:33:49 -0700 + Commit: 5d72283, github.com/apache/spark/pull/629 + + Updated doc for spark.closure.serializer to indicate only Java serializer work. 
+ Reynold Xin + 2014-05-05 00:52:06 -0700 + Commit: 6be7226, github.com/apache/spark/pull/642 + + Address SPARK-1717 + msiddalingaiah + 2014-05-04 21:59:10 -0700 + Commit: b5c62c8, github.com/apache/spark/pull/641 + + SPARK-1710: spark-submit should print better errors than "InvocationTargetException" + Sandeep + 2014-05-04 20:51:53 -0700 + Commit: afcb9ae, github.com/apache/spark/pull/630 + + EC2 script should exit with non-zero code on UsageError + Allan Douglas R. de Oliveira + 2014-05-04 20:36:51 -0700 + Commit: 7305278, github.com/apache/spark/pull/638 + + SPARK-1693: Most of the tests throw a java.lang.SecurityException when s... + witgo + 2014-05-04 17:48:52 -0700 + Commit: ec0bce1, github.com/apache/spark/pull/628 + + SPARK-1629. Addendum: Depend on commons lang3 (already used by tachyon) as it's used in ReplSuite, and return to use lang3 utility in Utils.scala + Sean Owen + 2014-05-04 17:43:28 -0700 + Commit: 4505bc2, github.com/apache/spark/pull/635 + + SPARK-1703 Warn users if Spark is run on JRE6 but compiled with JDK7. + Patrick Wendell + 2014-05-04 12:22:23 -0700 + Commit: 2f091d5, github.com/apache/spark/pull/627 + + SPARK-1663. (Addendum) Fix signature of one version of JavaPairRDDStream.reduceByKeyAndWindow() + Sean Owen + 2014-05-04 11:55:29 -0700 + Commit: 40d05a4, github.com/apache/spark/pull/633 + + SPARK-1658: Correctly identify if maven is installed and working + Rahul Singhal + 2014-05-04 11:08:39 -0700 + Commit: 2ee5f04, github.com/apache/spark/pull/580 + + The default version of yarn is equal to the hadoop version + witgo + 2014-05-03 23:32:12 -0700 + Commit: acbf307, github.com/apache/spark/pull/626 + + Whitelist Hive Tests + Michael Armbrust + 2014-05-03 23:13:51 -0700 + Commit: e88a636, github.com/apache/spark/pull/596 + + [SQL] Better logging when applying rules. + Michael Armbrust + 2014-05-03 18:38:44 -0700 + Commit: e24d5cd, github.com/apache/spark/pull/616 + + EC2 configurable workers + Allan Douglas R. 
de Oliveira + 2014-05-03 16:52:19 -0700 + Commit: 8406ac4, github.com/apache/spark/pull/612 + + SPARK-1689 AppClient should indicate app is dead() when removed + Aaron Davidson + 2014-05-03 13:27:10 -0700 + Commit: 36e687d, github.com/apache/spark/pull/605 + + [Bugfix] Tachyon file cleanup logical error + Cheng Lian + 2014-05-03 13:23:52 -0700 + Commit: bc3bfea, github.com/apache/spark/pull/575 + + SPARK-1663. Corrections for several compile errors in streaming code examples, and updates to follow API changes + Sean Owen + 2014-05-03 12:31:31 -0700 + Commit: 08c4d11, github.com/apache/spark/pull/589 + + [WIP] SPARK-1676: Cache Hadoop UGIs by default to prevent FileSystem leak + Thomas Graves + 2014-05-03 10:59:05 -0700 + Commit: 0441515, github.com/apache/spark/pull/621 + + Update SchemaRDD.scala + ArcherShao + 2014-05-03 00:17:36 -0700 + Commit: 34f22bc, github.com/apache/spark/pull/619 + + SPARK-1700: Close socket file descriptors on task completion + Aaron Davidson + 2014-05-02 23:55:13 -0700 + Commit: d2cbd3d, github.com/apache/spark/pull/623 + + SPARK-1492. Update Spark YARN docs to use spark-submit + Sandy Ryza + 2014-05-02 21:42:31 -0700 + Commit: a314342, github.com/apache/spark/pull/601 + + delete no use var + wangfei + 2014-05-02 21:34:54 -0700 + Commit: b65def7, github.com/apache/spark/pull/613 + + SPARK-1695: java8-tests compiler error: package com.google.common.co... 
+ witgo + 2014-05-02 12:40:27 -0700 + Commit: d28c058, github.com/apache/spark/pull/611 + + Add tests for FileLogger, EventLoggingListener, and ReplayListenerBus + Andrew Or + 2014-05-01 21:42:06 -0700 + Commit: d4c8af8, github.com/apache/spark/pull/591 + + SPARK-1659: improvements spark-submit usage + witgo + 2014-05-01 21:39:40 -0700 + Commit: 18595dd, github.com/apache/spark/pull/581 + + fix the spelling mistake + wangfei + 2014-05-01 21:37:22 -0700 + Commit: 35ca6c5, github.com/apache/spark/pull/614 + + [SQL] SPARK-1661 - Fix regex_serde test + Michael Armbrust + 2014-05-01 21:32:43 -0700 + Commit: d339b33, github.com/apache/spark/pull/595 + + SPARK-1691: Support quoted arguments inside of spark-submit. + Patrick Wendell + 2014-05-01 01:15:51 -0700 + Commit: dd601bf, github.com/apache/spark/pull/609 + + Fix SPARK-1629: Spark should inline use of commons-lang `SystemUtils.IS_... + witgo + 2014-04-30 09:49:45 -0700 + Commit: 74bb88b, github.com/apache/spark/pull/569 + + SPARK-1004. PySpark on YARN + Sandy Ryza + 2014-04-29 23:24:34 -0700 + Commit: 177361c, github.com/apache/spark/pull/30 + + Handle the vals that never used + WangTao + 2014-04-29 22:07:20 -0700 + Commit: b0ded1f, github.com/apache/spark/pull/565 + + Args for worker rather than master + Chen Chao + 2014-04-29 22:05:40 -0700 + Commit: 775020f, github.com/apache/spark/pull/587 + + [SPARK-1646] Micro-optimisation of ALS + Tor Myklebust + 2014-04-29 22:04:34 -0700 + Commit: 92269f9, github.com/apache/spark/pull/568 + + [SPARK-1674] fix interrupted system call error in pyspark's RDD.pipe + Xiangrui Meng + 2014-04-29 18:06:45 -0700 + Commit: 919ed31, github.com/apache/spark/pull/594 + + SPARK-1588. Restore SPARK_YARN_USER_ENV and SPARK_JAVA_OPTS for YARN. 
+ Sandy Ryza + 2014-04-29 12:54:02 -0700 + Commit: 5f48721, github.com/apache/spark/pull/586 + + SPARK-1509: add zipWithIndex zipWithUniqueId methods to java api + witgo + 2014-04-29 11:30:47 -0700 + Commit: 9754d1b, github.com/apache/spark/pull/423 + + SPARK-1557 Set permissions on event log files/directories + Thomas Graves + 2014-04-29 09:19:48 -0500 + Commit: bccd13e, github.com/apache/spark/pull/538 + + HOTFIX: minor change to release script + Patrick Wendell + 2014-04-29 00:59:38 -0700 + Commit: c27ce2b + + HOTFIX: minor change to release script + Patrick Wendell + 2014-04-29 00:53:32 -0700 + Commit: 838cb0e + + [SPARK-1636][MLLIB] Move main methods to examples + Xiangrui Meng + 2014-04-29 00:41:03 -0700 + Commit: aa519e3, github.com/apache/spark/pull/584 + + Minor fix to python table caching API. + Michael Armbrust + 2014-04-29 00:36:15 -0700 + Commit: 0995787, github.com/apache/spark/pull/585 + + HOTFIX: Bug in release script + Patrick Wendell + 2014-04-29 00:10:17 -0700 + Commit: 4ed58aa + + Manual revert of rc2 version changes. + Patrick Wendell + 2014-04-28 22:59:09 -0700 + Commit: 2863344 + + Improved build configuration + witgo + 2014-04-28 22:50:51 -0700 + Commit: ee96460, github.com/apache/spark/pull/480 + + SPARK-1652: Remove incorrect deprecation warning in spark-submit + Patrick Wendell + 2014-04-28 18:14:59 -0700 + Commit: 42ba706, github.com/apache/spark/pull/578 + + SPARK-1654 and SPARK-1653: Fixes in spark-submit. 
+ Patrick Wendell + 2014-04-28 17:29:22 -0700 + Commit: 2c9ce20, github.com/apache/spark/pull/576 + + SPARK-1652: Spark submit should fail gracefully if YARN not enabled + Patrick Wendell + 2014-04-28 17:26:57 -0700 + Commit: 38bf23e, github.com/apache/spark/pull/579 + + Changes to dev release script + Patrick Wendell + 2014-04-28 13:58:42 -0700 + Commit: 32d9db3 + + [SPARK-1633][Streaming] Java API unit test and example for custom streaming receiver in Java + Tathagata Das + 2014-04-28 13:58:09 -0700 + Commit: 6d89faf, github.com/apache/spark/pull/558 + + [SQL]Append some missing types for HiveUDF + Cheng Hao + 2014-04-27 23:59:42 -0700 + Commit: 42cb3b4, github.com/apache/spark/pull/459 + + Update the import package name for TestHive in sbt shell + Cheng Hao + 2014-04-27 23:57:29 -0700 + Commit: eb9308e, github.com/apache/spark/pull/574 + + Fix SPARK-1609: Executor fails to start when Command.extraJavaOptions contains multiple Java options + witgo + 2014-04-27 19:41:02 -0700 + Commit: 7bbf313, github.com/apache/spark/pull/547 + + SPARK-1145: Memory mapping with many small blocks can cause JVM allocation failures + Patrick Wendell + 2014-04-27 17:40:56 -0700 + Commit: 2f24159, github.com/apache/spark/pull/43 + + HOTFIX: Minor patch to merge script. + Patrick Wendell + 2014-04-27 15:45:17 -0700 + Commit: 99285d0 + + SPARK-1651: Delete existing deployment directory + Rahul Singhal + 2014-04-27 15:50:48 -0700 + Commit: 3c6c6c2, github.com/apache/spark/pull/573 + + SPARK-1648 Support closing JIRA's as part of merge script. + Patrick Wendell + 2014-04-27 15:41:57 -0700 + Commit: da26f9b, github.com/apache/spark/pull/570 + + SPARK-1650: Correctly identify maven project version + Rahul Singhal + 2014-04-27 15:17:06 -0700 + Commit: 98b13e0, github.com/apache/spark/pull/572 + + SPARK-1606: Infer user application arguments instead of requiring --arg. 
+ Patrick Wendell + 2014-04-26 19:24:29 -0700 + Commit: ce57624, github.com/apache/spark/pull/563 + + SPARK-1467: Make StorageLevel.apply() factory methods Developer APIs + Sandeep + 2014-04-26 19:04:33 -0700 + Commit: 18ecc63, github.com/apache/spark/pull/551 + + [SPARK-1608] [SQL] Fix Cast.nullable when cast from StringType to NumericType/TimestampType. + Takuya UESHIN + 2014-04-26 14:39:54 -0700 + Commit: dcea67f, github.com/apache/spark/pull/532 + + add note of how to support table with more than 22 fields + wangfei + 2014-04-26 14:38:42 -0700 + Commit: a020686, github.com/apache/spark/pull/564 + + [Spark-1382] Fix NPE in DStream.slice (updated version of #365) + zsxwing , Tathagata Das + 2014-04-25 19:04:34 -0700 + Commit: f85c681, github.com/apache/spark/pull/562 + + SPARK-1632. Remove unnecessary boxing in compares in ExternalAppendOnlyM... + Sandy Ryza + 2014-04-25 17:55:04 -0700 + Commit: 94c71e0, github.com/apache/spark/pull/559 + + SPARK-1235: manage the DAGScheduler EventProcessActor with supervisor and refactor the DAGScheduler with Akka + CodingCat , Xiangrui Meng , Nan Zhu + 2014-04-25 16:04:48 -0700 + Commit: 5673c1e, github.com/apache/spark/pull/186 + + SPARK-1607. HOTFIX: Fix syntax adapting Int result to Short + Sean Owen + 2014-04-25 14:17:38 -0700 + Commit: 784b2a6, github.com/apache/spark/pull/556 + + Update KafkaWordCount.scala + baishuo(白硕) + 2014-04-25 13:18:49 -0700 + Commit: a0912a8, github.com/apache/spark/pull/523 + + Delete the val that never used + WangTao + 2014-04-25 11:47:01 -0700 + Commit: 97bfeda, github.com/apache/spark/pull/553 + + SPARK-1621 Upgrade Chill to 0.3.6 + Matei Zaharia + 2014-04-25 11:12:41 -0700 + Commit: 2c8dfd4, github.com/apache/spark/pull/543 + + SPARK-1619 Launch spark-shell with spark-submit + Patrick Wendell + 2014-04-24 23:59:16 -0700 + Commit: 8ba7f40, github.com/apache/spark/pull/542 + + SPARK-1607. 
Replace octal literals, removed in Scala 2.11, with hex literals + Sean Owen + 2014-04-24 23:34:00 -0700 + Commit: 7493ca9, github.com/apache/spark/pull/529 + + Call correct stop(). + Aaron Davidson + 2014-04-24 23:22:03 -0700 + Commit: 3eba9bd, github.com/apache/spark/pull/527 + + SPARK-1242 Add aggregate to python rdd + Holden Karau + 2014-04-24 23:07:54 -0700 + Commit: f09a2c0, github.com/apache/spark/pull/139 + + Fix [SPARK-1078]: Remove the Unnecessary lift-json dependency + Sandeep + 2014-04-24 21:51:52 -0700 + Commit: 496b9ae, github.com/apache/spark/pull/536 + + [Typo] In the maven docs: chd -> cdh + Andrew Or + 2014-04-24 21:51:17 -0700 + Commit: db69841, github.com/apache/spark/pull/548 + + Generalize pattern for planning hash joins. + Michael Armbrust + 2014-04-24 21:42:33 -0700 + Commit: ab131ab, github.com/apache/spark/pull/418 + + [SPARK-1617] and [SPARK-1618] Improvements to streaming ui and bug fix to socket receiver + Tathagata Das + 2014-04-24 21:34:37 -0700 + Commit: d933c71, github.com/apache/spark/pull/540 + + SPARK-1584: Upgrade Flume dependency to 1.4.0 + tmalaska + 2014-04-24 20:31:17 -0700 + Commit: 777a9a5, github.com/apache/spark/pull/507 + + SPARK-1586 Windows build fixes + Mridul Muralidharan + 2014-04-24 20:48:33 -0700 + Commit: 51a387a, github.com/apache/spark/pull/505 + + [SPARK-986]: Job cancelation for PySpark + Ahir Reddy + 2014-04-24 20:21:10 -0700 + Commit: 7b6d774, github.com/apache/spark/pull/541 + + [SPARK-1615] Synchronize accesses to the LiveListenerBus' event queue + Andrew Or + 2014-04-24 20:18:15 -0700 + Commit: 963046c, github.com/apache/spark/pull/544 + + [SPARK-1510] Spark Streaming metrics source for metrics system + jerryshao , Tathagata Das + 2014-04-24 18:56:57 -0700 + Commit: 0bc0f36, github.com/apache/spark/pull/545 + + Spark 1489 Fix the HistoryServer view acls + Thomas Graves + 2014-04-24 18:38:10 -0700 + Commit: c8dd132, github.com/apache/spark/pull/509 + + [SQL] Add support for parsing indexing into arrays 
in SQL. + Michael Armbrust + 2014-04-24 18:21:00 -0700 + Commit: 2a35fba, github.com/apache/spark/pull/518 + + [SPARK-1592][streaming] Automatically remove streaming input blocks + Tathagata Das + 2014-04-24 18:18:22 -0700 + Commit: a3b6d85, github.com/apache/spark/pull/512 + + SPARK-1438 RDD.sample() make seed param optional + Arun Ramakrishnan + 2014-04-24 17:27:16 -0700 + Commit: 521d435, github.com/apache/spark/pull/477 + + SPARK-1104: kill Process in workerThread of ExecutorRunner + CodingCat + 2014-04-24 15:55:18 -0700 + Commit: a1f8779, github.com/apache/spark/pull/35 + + Fix Scala Style + Sandeep + 2014-04-24 15:07:23 -0700 + Commit: 2250c7a, github.com/apache/spark/pull/531 + + SPARK-1494 Don't initialize classes loaded by MIMA excludes, attempt 2 + Michael Armbrust + 2014-04-24 14:54:01 -0700 + Commit: 5ca01f6, github.com/apache/spark/pull/526 + + Spark 1490 Add kerberos support to the HistoryServer + Thomas Graves + 2014-04-24 11:15:12 -0700 + Commit: 866b03e, github.com/apache/spark/pull/513 + + SPARK-1611: Fix incorrect initialization order in AppendOnlyMap + zsxwing + 2014-04-24 11:13:40 -0700 + Commit: 00a3ccc, github.com/apache/spark/pull/534 + + SPARK-1488. Squash more language feature warnings in new commits by importing implicitConversion + Sean Owen + 2014-04-24 10:06:18 -0700 + Commit: 8d92d93, github.com/apache/spark/pull/528 + + Small changes to release script + Patrick Wendell + 2014-04-24 09:59:44 -0700 + Commit: 563be2f + + [SPARK-1610] [SQL] Fix Cast to use exact type value when cast from BooleanType to NumericTy... 
+ Takuya UESHIN + 2014-04-24 09:57:28 -0700 + Commit: 8f8e051, github.com/apache/spark/pull/533 + + SPARK-1601 & SPARK-1602: two bug fixes related to cancellation + Reynold Xin + 2014-04-24 00:27:45 -0700 + Commit: f98aac9, github.com/apache/spark/pull/521 + + SPARK-1587 Fix thread leak + Mridul Muralidharan + 2014-04-23 23:20:55 -0700 + Commit: 8684a15, github.com/apache/spark/pull/504 + + [Fix #79] Replace Breakable For Loops By While Loops + Sandeep + 2014-04-23 22:47:59 -0700 + Commit: e890771, github.com/apache/spark/pull/503 + + SPARK-1589: Fix the incorrect compare + zsxwing + 2014-04-23 22:36:02 -0700 + Commit: 9716a72, github.com/apache/spark/pull/508 + + Mark all fields of EdgePartition, Graph, and GraphOps transient + Ankur Dave + 2014-04-23 22:01:13 -0700 + Commit: bdd2691, github.com/apache/spark/pull/520 + + Update Java api for setJobGroup with interruptOnCancel + Aaron Davidson + 2014-04-23 22:00:22 -0700 + Commit: 36511ea, github.com/apache/spark/pull/522 + + [Hot Fix #469] Fix flaky test in SparkListenerSuite + Andrew Or + 2014-04-23 21:59:33 -0700 + Commit: 99c0c33, github.com/apache/spark/pull/516 + + [SPARK-1540] Add an optional Ordering parameter to PairRDDFunctions. + Matei Zaharia + 2014-04-23 17:03:54 -0700 + Commit: 31c7d83, github.com/apache/spark/pull/487 + + SPARK-1582 Invoke Thread.interrupt() when cancelling jobs + Aaron Davidson + 2014-04-23 16:52:49 -0700 + Commit: 55e6bea, github.com/apache/spark/pull/498 + + Honor default fs name when initializing event logger. 
+ Marcelo Vanzin + 2014-04-23 14:47:38 -0700 + Commit: 46b30f9, github.com/apache/spark/pull/450 + + SPARK-1572 Don't kill Executor if PythonRDD fails while computing parent + Aaron Davidson + 2014-04-23 14:46:30 -0700 + Commit: be8f26f, github.com/apache/spark/pull/486 + + SPARK-1583: Fix a bug that using java.util.HashMap by mistake + zsxwing + 2014-04-23 14:12:20 -0700 + Commit: 19ef78f, github.com/apache/spark/pull/500 + + SPARK-1119 and other build improvements + Patrick Wendell + 2014-04-23 10:19:32 -0700 + Commit: d36d75c, github.com/apache/spark/pull/502 + + [SQL] SPARK-1571 Mistake in java example code + Michael Armbrust + 2014-04-22 22:19:32 -0700 + Commit: b0d8793, github.com/apache/spark/pull/496 + + SPARK-1494 Don't initialize classes loaded by MIMA excludes. + Michael Armbrust + 2014-04-22 21:56:15 -0700 + Commit: 18b1867, github.com/apache/spark/pull/494 + + SPARK-1562 Fix visibility / annotation of Spark SQL APIs + Michael Armbrust + 2014-04-22 20:02:33 -0700 + Commit: 0e03e6a, github.com/apache/spark/pull/489 + + [FIX: SPARK-1376] use --arg instead of --args in SparkSubmit to avoid warning messages + Xiangrui Meng + 2014-04-22 19:38:27 -0700 + Commit: 61930bd, github.com/apache/spark/pull/485 + + [streaming][SPARK-1578] Removed requirement for TTL in StreamingContext. + Tathagata Das + 2014-04-22 19:35:13 -0700 + Commit: bf47559, github.com/apache/spark/pull/491 + + [Spark-1538] Fix SparkUI incorrectly hiding persisted RDDs + Andrew Or + 2014-04-22 19:24:03 -0700 + Commit: 104590c, github.com/apache/spark/pull/469 + + Assorted clean-up for Spark-on-YARN. + Patrick Wendell + 2014-04-22 19:22:06 -0700 + Commit: f764f47, github.com/apache/spark/pull/488 + + [SPARK-1570] Fix classloading in JavaSQLContext.applySchema + Kan Zhang + 2014-04-22 15:05:12 -0700 + Commit: f9734e2, github.com/apache/spark/pull/484 + + Fix compilation on Hadoop 2.4.x. 
+ Marcelo Vanzin + 2014-04-22 14:28:41 -0700 + Commit: b6ba546, github.com/apache/spark/pull/483 + + [Fix #204] Eliminate delay between binding and log checking + Andrew Or + 2014-04-22 14:27:49 -0700 + Commit: 54c96c2, github.com/apache/spark/pull/441 + + [Fix #274] Document + fix annotation usages + Andrew Or + 2014-04-21 22:24:44 -0700 + Commit: 898fc34, github.com/apache/spark/pull/470 + + [HOTFIX] SPARK-1399: remove outdated comments + CodingCat + 2014-04-22 09:43:13 -0700 + Commit: 61d7401, github.com/apache/spark/pull/474 + + [SPARK-1281] Improve partitioning in ALS + Tor Myklebust + 2014-04-22 11:07:30 -0700 + Commit: 4834adf, github.com/apache/spark/pull/407 + + fix bugs of dot in python + Xusen Yin + 2014-04-22 11:06:18 -0700 + Commit: 4f2f093, github.com/apache/spark/pull/463 + + [SPARK-1506][MLLIB] Documentation improvements for MLlib 1.0 + Xiangrui Meng + 2014-04-22 11:20:47 -0700 + Commit: 3f708f5, github.com/apache/spark/pull/422 + + [SPARK-1560]: Updated Pyrolite Dependency to be Java 6 compatible + Ahir Reddy + 2014-04-22 09:44:41 -0700 + Commit: 798d93f, github.com/apache/spark/pull/479 + + SPARK-1496: Have jarOfClass return Option[String] + Patrick Wendell + 2014-04-22 00:42:16 -0700 + Commit: 72aa131, github.com/apache/spark/pull/438 + + [SPARK-1459] Use local path (and not complete URL) when opening local lo... 
+ Marcelo Vanzin + 2014-04-21 23:10:53 -0700 + Commit: 0a73103, github.com/apache/spark/pull/375 + + [SPARK-1439, SPARK-1440] Generate unified Scaladoc across projects and Javadocs + Matei Zaharia + 2014-04-21 21:57:40 -0700 + Commit: b0d70e4, github.com/apache/spark/pull/457 + + [SPARK-1332] Improve Spark Streaming's Network Receiver and InputDStream API [WIP] + Tathagata Das + 2014-04-21 19:04:49 -0700 + Commit: 94cbe23, github.com/apache/spark/pull/300 + + Updating versions for Spark 1.0 + Patrick Wendell + 2014-04-21 16:59:38 -0700 + Commit: a34e6fd + + Dev script: include RC name in git tag + Patrick Wendell + 2014-04-21 14:21:17 -0700 + Commit: 1532af9 + + SPARK-1399: show stage failure reason in UI + CodingCat , Nan Zhu + 2014-04-21 14:10:23 -0700 + Commit: 4b9220d, github.com/apache/spark/pull/421 + + SPARK-1539: RDDPage.scala contains RddPage class + Xiangrui Meng + 2014-04-21 12:48:02 -0700 + Commit: 8aa3860, github.com/apache/spark/pull/454 + + [Hot Fix] Ignore org.apache.spark.ui.UISuite tests + Andrew Or + 2014-04-21 12:37:43 -0700 + Commit: d62ce6d, github.com/apache/spark/pull/466 + + REPL cleanup. + Michael Armbrust + 2014-04-19 17:32:24 -0700 + Commit: 8e1e7ec, github.com/apache/spark/pull/451 + + Clean up and simplify Spark configuration + Patrick Wendell + 2014-04-21 10:26:33 -0700 + Commit: 29ee101, github.com/apache/spark/pull/299 + + [SPARK-1535] ALS: Avoid the garbage-creating ctor of DoubleMatrix + Tor Myklebust + 2014-04-19 15:10:18 -0700 + Commit: 9ce6ed4, github.com/apache/spark/pull/442 + + Add insertInto and saveAsTable to Python API. + Michael Armbrust + 2014-04-19 15:08:54 -0700 + Commit: 6ab0719, github.com/apache/spark/pull/447 + + Use scala deprecation instead of java. 
+ Michael Armbrust + 2014-04-19 15:06:04 -0700 + Commit: bfb09c6, github.com/apache/spark/pull/452 + + README update + Reynold Xin + 2014-04-18 22:34:39 -0700 + Commit: 2fe6b18, github.com/apache/spark/pull/443 + + SPARK-1482: Fix potential resource leaks in saveAsHadoopDataset and save... + zsxwing + 2014-04-18 17:49:22 -0700 + Commit: ea17460, github.com/apache/spark/pull/400 + + SPARK-1456 Remove view bounds on Ordered in favor of a context bound on Ordering. + Michael Armbrust + 2014-04-18 12:04:13 -0700 + Commit: 9e21b97, github.com/apache/spark/pull/410 + + Fixed broken pyspark shell. + Reynold Xin + 2014-04-18 10:10:13 -0700 + Commit: d8767c4, github.com/apache/spark/pull/444 + + SPARK-1523: improve the readability of code in AkkaUtil + CodingCat + 2014-04-18 10:05:00 -0700 + Commit: 171cea8, github.com/apache/spark/pull/434 + + SPARK-1357 (addendum). More Experimental items in MLlib + Sean Owen + 2014-04-18 10:04:02 -0700 + Commit: 1a30429, github.com/apache/spark/pull/372 + + [SPARK-1520] remove fastutil from dependencies + Xiangrui Meng + 2014-04-18 10:03:15 -0700 + Commit: c40eec8, github.com/apache/spark/pull/437 + + Reuses Row object in ExistingRdd.productToRowRdd() + Cheng Lian + 2014-04-18 10:02:27 -0700 + Commit: 977467e, github.com/apache/spark/pull/432 + + SPARK-1483: Rename minSplits to minPartitions in public APIs + CodingCat + 2014-04-18 10:01:16 -0700 + Commit: 969a075, github.com/apache/spark/pull/430 + + HOTFIX: Ignore streaming UI test + Patrick Wendell + 2014-04-17 17:33:24 -0700 + Commit: 1c0dc37, github.com/apache/spark/pull/440 + + FIX: Don't build Hive in assembly unless running Hive tests. 
+ Patrick Wendell + 2014-04-17 17:24:00 -0700 + Commit: 3225272, github.com/apache/spark/pull/439 + + Add clean to build + Patrick Wendell + 2014-04-16 16:32:34 -0700 + Commit: 67d01d8 + + HOTFIX: Use file name and not paths for excludes + Patrick Wendell + 2014-04-14 15:51:54 -0700 + Commit: 5349fab + + SPARK-1408 Modify Spark on Yarn to point to the history server when app ... + Thomas Graves + 2014-04-17 16:36:37 -0500 + Commit: 6195fb8, github.com/apache/spark/pull/362 + + [SPARK-1395] Allow "local:" URIs to work on Yarn. + Marcelo Vanzin + 2014-04-17 10:29:38 -0500 + Commit: a83a794, github.com/apache/spark/pull/303 + + [python alternative] pyspark require Python2, failing if system default is Py3 from shell.py + AbhishekKr + 2014-04-16 19:05:40 -0700 + Commit: b3ad707, github.com/apache/spark/pull/399 + + SPARK-1462: Examples of ML algorithms are using deprecated APIs + Sandeep + 2014-04-16 18:23:07 -0700 + Commit: 13fb4c7, github.com/apache/spark/pull/416 + + Include stack trace for exceptions thrown by user code. 
+ Michael Armbrust + 2014-04-16 18:12:56 -0700 + Commit: aef8a4a, github.com/apache/spark/pull/409 + + Update ReducedWindowedDStream.scala + baishuo(白硕) + 2014-04-16 18:08:11 -0700 + Commit: 822353d, github.com/apache/spark/pull/425 + + misleading task number of groupByKey + Chen Chao + 2014-04-16 17:58:42 -0700 + Commit: 51c41da, github.com/apache/spark/pull/403 + + Fixing a race condition in event listener unit test + Kan Zhang + 2014-04-16 17:39:11 -0700 + Commit: f0abf5f, github.com/apache/spark/pull/401 + + remove unnecessary brace and semicolon in 'putBlockInfo.synchronize' block + Chen Chao + 2014-04-16 17:30:01 -0700 + Commit: e43e31d, github.com/apache/spark/pull/411 + + SPARK-1329: Create pid2vid with correct number of partitions + Ankur Dave + 2014-04-16 17:16:55 -0700 + Commit: b4ea3d9, github.com/apache/spark/pull/368 + + Rebuild routing table after Graph.reverse + Ankur Dave + 2014-04-16 17:15:50 -0700 + Commit: 602b9ea, github.com/apache/spark/pull/431 + + [SPARK-1511] use Files.move instead of renameTo in TestUtils.scala + Ye Xianjin + 2014-04-16 14:56:22 -0700 + Commit: 87a7c4f, github.com/apache/spark/pull/427 + + SPARK-1465: Spark compilation is broken with the latest hadoop-2.4.0 release + xuan , xuan + 2014-04-16 14:41:22 -0500 + Commit: d8fc4a4, github.com/apache/spark/pull/396 + + SPARK-1469: Scheduler mode should accept lower-case definitions and have... + Sandeep + 2014-04-16 09:58:57 -0700 + Commit: b75301f, github.com/apache/spark/pull/388 + + Minor addition to SPARK-1497 + Patrick Wendell + 2014-04-16 09:43:17 -0700 + Commit: 4479ecd + + SPARK-1497. 
Fix scalastyle warnings in YARN, Hive code + Sean Owen + 2014-04-16 09:34:59 -0700 + Commit: c744d66, github.com/apache/spark/pull/413 + + SPARK-1310: Start adding k-fold cross validation to MLLib [adds kFold to MLUtils & fixes bug in BernoulliSampler] + Holden Karau + 2014-04-16 09:33:27 -0700 + Commit: 8efec04, github.com/apache/spark/pull/18 + + update spark.default.parallelism + Chen Chao + 2014-04-16 09:14:18 -0700 + Commit: e4f5577, github.com/apache/spark/pull/389 + + Loads test tables when running "sbt hive/console" without HIVE_DEV_HOME + Cheng Lian + 2014-04-16 08:54:34 -0700 + Commit: 9e908ab, github.com/apache/spark/pull/417 + + Make "spark logo" link refer to "/". + Marcelo Vanzin + 2014-04-16 08:53:01 -0700 + Commit: 5fe18a7, github.com/apache/spark/pull/408 + + [SPARK-959] Updated SBT from 0.13.1 to 0.13.2 + Cheng Lian + 2014-04-16 08:52:14 -0700 + Commit: 1ea9a21, github.com/apache/spark/pull/426 + + [SQL] SPARK-1424 Generalize insertIntoTable functions on SchemaRDDs + Michael Armbrust + 2014-04-15 20:40:40 -0700 + Commit: e5130d9, github.com/apache/spark/pull/354 + + [WIP] SPARK-1430: Support sparse data in Python MLlib + Matei Zaharia + 2014-04-15 20:33:24 -0700 + Commit: 95647fa, github.com/apache/spark/pull/341 + + [FIX] update sbt-idea to version 1.6.0 + Xiangrui Meng + 2014-04-15 19:37:32 -0700 + Commit: 33d6e37, github.com/apache/spark/pull/419 + + SPARK-1455: Better isolation for unit tests. + Patrick Wendell + 2014-04-15 19:34:39 -0700 + Commit: 110e825, github.com/apache/spark/pull/420 + + Decision Tree documentation for MLlib programming guide + Manish Amde + 2014-04-15 11:14:28 -0700 + Commit: 194ed06, github.com/apache/spark/pull/402 + + [SPARK-1157][MLlib] L-BFGS Optimizer based on Breeze's implementation. + DB Tsai + 2014-04-15 11:12:47 -0700 + Commit: 5812472, github.com/apache/spark/pull/353 + + SPARK-1501: Ensure assertions in Graph.apply are asserted. 
+ William Benton + 2014-04-15 10:38:42 -0700 + Commit: 692dd69, github.com/apache/spark/pull/415 + + SPARK-1426: Make MLlib work with NumPy versions older than 1.7 + Sandeep + 2014-04-15 00:19:43 -0700 + Commit: 1491b2a, github.com/apache/spark/pull/391 + + SPARK-1374: PySpark API for SparkSQL + Ahir Reddy , Michael Armbrust + 2014-04-15 00:07:55 -0700 + Commit: 7433f64, github.com/apache/spark/pull/363 + + SPARK-1488. Resolve scalac feature warnings during build + Sean Owen + 2014-04-14 19:50:00 -0700 + Commit: 7471828, github.com/apache/spark/pull/404 + + [BUGFIX] In-memory columnar storage bug fixes + Cheng Lian , Michael Armbrust + 2014-04-14 15:22:43 -0700 + Commit: fdebb69, github.com/apache/spark/pull/374 + + [SPARK-1415] Hadoop min split for wholeTextFiles() + Xusen Yin + 2014-04-13 13:18:52 -0700 + Commit: 1cf565f, github.com/apache/spark/pull/376 + + SPARK-1480: Clean up use of classloaders + Patrick Wendell + 2014-04-13 08:58:37 -0700 + Commit: 3537e25, github.com/apache/spark/pull/398 + + [SPARK-1403] Move the class loader creation back to where it was in 0.9.0 + Bharath Bhushan + 2014-04-12 20:52:29 -0700 + Commit: c970d86, github.com/apache/spark/pull/322 + + [Fix #204] Update out-dated comments + Andrew Or + 2014-04-12 16:33:38 -0700 + Commit: 52d401b, github.com/apache/spark/pull/381 + + [SPARK-1386] Web UI for Spark Streaming + Tathagata Das , Andrew Or + 2014-04-11 23:33:49 -0700 + Commit: f36dc3f, github.com/apache/spark/pull/290 + + SPARK-1057 (alternative) Remove fastutil + Sean Owen + 2014-04-11 22:46:47 -0700 + Commit: 4dfcb38, github.com/apache/spark/pull/266 + + Update WindowedDStream.scala + baishuo(白硕) + 2014-04-11 20:33:42 -0700 + Commit: dac6240, github.com/apache/spark/pull/390 + + [WIP] [SPARK-1328] Add vector statistics + Xusen Yin , Xiangrui Meng + 2014-04-11 19:43:22 -0700 + Commit: ce0ce3d, github.com/apache/spark/pull/268 + + [FIX] make coalesce test deterministic in RDDSuite + Xiangrui Meng + 2014-04-11 19:41:40 -0700 + Commit: 
9afaeed, github.com/apache/spark/pull/387 + + HOTFIX: Ignore python metastore files in RAT checks. + Patrick Wendell + 2014-04-11 13:23:21 -0700 + Commit: 79eb276, github.com/apache/spark/pull/393 + + [SPARK-1225, 1241] [MLLIB] Add AreaUnderCurve and BinaryClassificationMetrics + Xiangrui Meng + 2014-04-11 12:06:13 -0700 + Commit: e6128b5, github.com/apache/spark/pull/364 + + Some clean up in build/docs + Patrick Wendell + 2014-04-11 10:45:27 -0700 + Commit: 170b09d, github.com/apache/spark/pull/382 + + SPARK-1417: Spark on Yarn - spark UI link from resourcemanager is broken + Thomas Graves + 2014-04-11 13:17:48 +0530 + Commit: 9e90c46, github.com/apache/spark/pull/344 + + SPARK-1202: Improvements to task killing in the UI. + Patrick Wendell + 2014-04-10 20:43:56 -0700 + Commit: a1bb4c6, github.com/apache/spark/pull/386 + + Add Spark v0.9.1 to ec2 launch script and use it as the default + Harvey Feng + 2014-04-10 18:25:54 -0700 + Commit: 59de39b, github.com/apache/spark/pull/385 + + Set spark.executor.uri from environment variable (needed by Mesos) + Ivan Wick + 2014-04-10 17:49:30 -0700 + Commit: 41df293, github.com/apache/spark/pull/311 + + SPARK-1202 - Add a "cancel" button in the UI for stages + Sundeep Narravula , Sundeep Narravula + 2014-04-10 17:10:11 -0700 + Commit: 211f974, github.com/apache/spark/pull/246 + + [SQL] Improve column pruning in the optimizer. 
+ Michael Armbrust + 2014-04-10 16:20:33 -0700 + Commit: 4843ef0, github.com/apache/spark/pull/378 + + Remove Unnecessary Whitespace's + Sandeep + 2014-04-10 15:04:13 -0700 + Commit: 09bf14b, github.com/apache/spark/pull/380 + + Update tuning.md + Andrew Ash + 2014-04-10 14:59:58 -0700 + Commit: 4c9906d, github.com/apache/spark/pull/384 + + Revert "SPARK-1433: Upgrade Mesos dependency to 0.17.0" + Patrick Wendell + 2014-04-10 14:43:29 -0700 + Commit: 1e2cdbc + + SPARK-1428: MLlib should convert non-float64 NumPy arrays to float64 instead of complaining + Sandeep + 2014-04-10 11:17:41 -0700 + Commit: 2ac43ad, github.com/apache/spark/pull/356 + + [SPARK-1276] Add a HistoryServer to render persisted UI + Andrew Or + 2014-04-10 10:39:34 -0700 + Commit: 9ae80bf, github.com/apache/spark/pull/204 + + Fix SPARK-1413: Parquet messes up stdout and stdin when used in Spark REPL + witgo + 2014-04-10 10:35:24 -0700 + Commit: a74fbbb, github.com/apache/spark/pull/325 + + Revert "SPARK-729: Closures not always serialized at capture time" + Patrick Wendell + 2014-04-10 02:10:40 -0700 + Commit: e6d4a74 + + SPARK-1446: Spark examples should not do a System.exit + Sandeep + 2014-04-10 00:37:21 -0700 + Commit: e55cc4b, github.com/apache/spark/pull/370 + + SPARK-729: Closures not always serialized at capture time + William Benton + 2014-04-09 18:56:27 -0700 + Commit: 8ca3b2b, github.com/apache/spark/pull/189 + + [SPARK-1357 (fix)] remove empty line after :: DeveloperApi/Experimental :: + Xiangrui Meng + 2014-04-09 17:08:17 -0700 + Commit: 0adc932, github.com/apache/spark/pull/373 + + SPARK-1407 drain event queue before stopping event logger + Kan Zhang + 2014-04-09 15:24:33 -0700 + Commit: eb5f2b6, github.com/apache/spark/pull/366 + + [SPARK-1357] [MLLIB] Annotate developer and experimental APIs + Xiangrui Meng + 2014-04-09 02:21:15 -0700 + Commit: bde9cc1, github.com/apache/spark/pull/298 + + SPARK-1093: Annotate developer and experimental API's + Patrick Wendell , Andrew Or + 
2014-04-09 01:14:46 -0700 + Commit: 87bd1f9, github.com/apache/spark/pull/274 + + [SPARK-1390] Refactoring of matrices backed by RDDs + Xiangrui Meng + 2014-04-08 23:01:15 -0700 + Commit: 9689b66, github.com/apache/spark/pull/296 + + Spark-939: allow user jars to take precedence over spark jars + Holden Karau + 2014-04-08 22:29:21 -0700 + Commit: fa0524f, github.com/apache/spark/pull/217 + + [SPARK-1434] [MLLIB] change labelParser from anonymous function to trait + Xiangrui Meng + 2014-04-08 20:37:01 -0700 + Commit: b9e0c93, github.com/apache/spark/pull/345 + + Spark 1271: Co-Group and Group-By should pass Iterable[X] + Holden Karau + 2014-04-08 18:15:52 -0700 + Commit: ce8ec54, github.com/apache/spark/pull/242 + + SPARK-1433: Upgrade Mesos dependency to 0.17.0 + Sandeep + 2014-04-08 16:19:22 -0700 + Commit: 12c077d, github.com/apache/spark/pull/355 + + [SPARK-1397] Notify SparkListeners when stages fail or are cancelled. + Kay Ousterhout + 2014-04-08 14:42:02 -0700 + Commit: fac6085, github.com/apache/spark/pull/309 + + SPARK-1445: compute-classpath should not print error if lib_managed not found + Aaron Davidson + 2014-04-08 14:40:20 -0700 + Commit: e25b593, github.com/apache/spark/pull/361 + + SPARK-1348 binding Master, Worker, and App Web UI to all interfaces + Kan Zhang + 2014-04-08 14:30:24 -0700 + Commit: a8d86b0, github.com/apache/spark/pull/318 + + Remove extra semicolon in import statement and unused import in ApplicationMaster + Henry Saputra + 2014-04-08 14:23:16 -0700 + Commit: 3bc0548, github.com/apache/spark/pull/358 + + [SPARK-1396] Properly cleanup DAGScheduler on job cancellation. 
+ Kay Ousterhout + 2014-04-08 01:03:33 -0700 + Commit: 6dc5f58, github.com/apache/spark/pull/305 + + [SPARK-1331] Added graceful shutdown to Spark Streaming + Tathagata Das + 2014-04-08 00:00:17 -0700 + Commit: 83ac9a4, github.com/apache/spark/pull/247 + + [SPARK-1103] Automatic garbage collection of RDD, shuffle and broadcast data + Tathagata Das , Andrew Or , Roman Pastukhov + 2014-04-07 23:40:21 -0700 + Commit: 11eabbe, github.com/apache/spark/pull/126 + + [SPARK-1402] Added 3 more compression schemes + Cheng Lian + 2014-04-07 22:24:12 -0700 + Commit: 0d0493f, github.com/apache/spark/pull/330 + + Change timestamp cast semantics. When cast to numeric types, return the unix time in seconds (instead of millis). + Reynold Xin + 2014-04-07 19:28:24 -0700 + Commit: f27e56a, github.com/apache/spark/pull/352 + + Added eval for Rand (without any support for user-defined seed). + Reynold Xin + 2014-04-07 18:40:08 -0700 + Commit: 31e6fff, github.com/apache/spark/pull/349 + + Removed the default eval implementation from Expression, and added a bunch of override's in classes I touched. + Reynold Xin + 2014-04-07 18:39:18 -0700 + Commit: 55dfd5d, github.com/apache/spark/pull/350 + + [sql] Rename execution/aggregates.scala Aggregate.scala, and added a bunch of private[this] to variables. + Reynold Xin + 2014-04-07 18:38:44 -0700 + Commit: 14c9238, github.com/apache/spark/pull/348 + + SPARK-1099: Introduce local[*] mode to infer number of cores + Aaron Davidson + 2014-04-07 13:06:30 -0700 + Commit: 0307db0, github.com/apache/spark/pull/182 + + HOTFIX: Disable actor input stream test. + Patrick Wendell + 2014-04-07 12:47:27 -0700 + Commit: 2a2ca48, github.com/apache/spark/pull/347 + + SPARK-1252. On YARN, use container-log4j.properties for executors + Sandy Ryza + 2014-04-07 13:28:14 -0500 + Commit: 9dd8b91, github.com/apache/spark/pull/148 + + [sql] Rename Expression.apply to eval for better readability. 
+ Reynold Xin + 2014-04-07 10:45:31 -0700 + Commit: 83f2a2f, github.com/apache/spark/pull/340 + + SPARK-1432: Make sure that all metadata fields are properly cleaned + Davis Shepherd + 2014-04-07 10:02:00 -0700 + Commit: a3c51c6, github.com/apache/spark/pull/338 + + [SQL] SPARK-1427 Fix toString for SchemaRDD NativeCommands. + Michael Armbrust + 2014-04-07 01:46:50 -0700 + Commit: b5bae84, github.com/apache/spark/pull/343 + + [SQL] SPARK-1371 Hash Aggregation Improvements + Michael Armbrust + 2014-04-07 00:14:00 -0700 + Commit: accd099, github.com/apache/spark/pull/295 + + SPARK-1431: Allow merging conflicting pull requests + Patrick Wendell + 2014-04-06 21:04:45 -0700 + Commit: 87d0928, github.com/apache/spark/pull/342 + + SPARK-1154: Clean up app folders in worker nodes + Evan Chan , Kelvin Chu + 2014-04-06 19:17:33 -0700 + Commit: 1440154, github.com/apache/spark/pull/288 + + SPARK-1314: Use SPARK_HIVE to determine if we include Hive in packaging + Aaron Davidson + 2014-04-06 17:48:41 -0700 + Commit: 4106558, github.com/apache/spark/pull/237 + + SPARK-1349: spark-shell gets its own command history + Aaron Davidson + 2014-04-06 17:43:44 -0700 + Commit: 7ce52c4, github.com/apache/spark/pull/267 + + SPARK-1387. Update build plugins, avoid plugin version warning, centralize versions + Sean Owen + 2014-04-06 17:40:37 -0700 + Commit: 856c50f, github.com/apache/spark/pull/291 + + [SPARK-1259] Make RDD locally iterable + Egor Pakhomov + 2014-04-06 16:41:23 -0700 + Commit: e258e50, github.com/apache/spark/pull/156 + + Fix SPARK-1420 The maven build error for Spark Catalyst + witgo + 2014-04-06 16:03:06 -0700 + Commit: 7012ffa, github.com/apache/spark/pull/333 + + SPARK-1421. 
Make MLlib work on Python 2.6 + Matei Zaharia + 2014-04-05 20:52:05 -0700 + Commit: 0b85516, github.com/apache/spark/pull/335 + + Fix for PR #195 for Java 6 + Sean Owen + 2014-04-05 19:08:24 -0700 + Commit: 890d63b, github.com/apache/spark/pull/334 + + [SPARK-1371] fix computePreferredLocations signature to not depend on underlying implementation + Mridul Muralidharan + 2014-04-05 15:23:37 -0700 + Commit: 6e88583, github.com/apache/spark/pull/302 + + Remove the getStageInfo() method from SparkContext. + Kay Ousterhout + 2014-04-05 15:17:50 -0700 + Commit: 2d0150c, github.com/apache/spark/pull/308 + + HOTFIX for broken CI, by SPARK-1336 + Prashant Sharma , Prashant Sharma + 2014-04-04 22:49:19 -0700 + Commit: 7c18428, github.com/apache/spark/pull/321 + + small fix ( proogram -> program ) + Prabeesh K + 2014-04-04 21:32:00 -0700 + Commit: 0acc7a0, github.com/apache/spark/pull/331 + + [SQL] SPARK-1366 Consistent sql function across different types of SQLContexts + Michael Armbrust + 2014-04-04 21:15:33 -0700 + Commit: 8de038e, github.com/apache/spark/pull/319 + + SPARK-1305: Support persisting RDD's directly to Tachyon + Haoyuan Li , RongGu + 2014-04-04 20:36:24 -0700 + Commit: b50ddfd, github.com/apache/spark/pull/158 + + [SPARK-1419] Bumped parent POM to apache 14 + Mark Hamstra + 2014-04-04 19:19:48 -0700 + Commit: 1347ebd, github.com/apache/spark/pull/328 + + Add test utility for generating Jar files with compiled classes. + Patrick Wendell + 2014-04-04 19:15:15 -0700 + Commit: 5f3c1bb, github.com/apache/spark/pull/326 + + SPARK-1414. Python API for SparkContext.wholeTextFiles + Matei Zaharia + 2014-04-04 17:29:29 -0700 + Commit: 60e18ce, github.com/apache/spark/pull/327 + + [SQL] Minor fixes. 
+ Michael Armbrust + 2014-04-04 17:23:17 -0700 + Commit: d956cc2, github.com/apache/spark/pull/315 + + [SPARK-1198] Allow pipes tasks to run in different sub-directories + Thomas Graves + 2014-04-04 17:16:31 -0700 + Commit: 198892f, github.com/apache/spark/pull/128 + + Don't create SparkContext in JobProgressListenerSuite. + Patrick Wendell + 2014-04-04 14:46:32 -0700 + Commit: a02b535, github.com/apache/spark/pull/324 + + SPARK-1375. Additional spark-submit cleanup + Sandy Ryza + 2014-04-04 13:28:42 -0700 + Commit: 16b8308, github.com/apache/spark/pull/278 + + [SPARK-1133] Add whole text files reader in MLlib + Xusen Yin + 2014-04-04 11:12:47 -0700 + Commit: f1fa617, github.com/apache/spark/pull/252 + + SPARK-1404: Always upgrade spark-env.sh vars to environment vars + Aaron Davidson + 2014-04-04 09:50:24 -0700 + Commit: 01cf4c4, github.com/apache/spark/pull/310 + + SPARK-1350. Always use JAVA_HOME to run executor container JVMs. + Sandy Ryza + 2014-04-04 08:54:04 -0500 + Commit: 7f32fd4, github.com/apache/spark/pull/313 + + SPARK-1337: Application web UI garbage collects newest stages + Patrick Wendell + 2014-04-03 22:13:56 -0700 + Commit: ee6e9e7, github.com/apache/spark/pull/320 + + Revert "[SPARK-1398] Removed findbugs jsr305 dependency" + Patrick Wendell + 2014-04-03 17:00:06 -0700 + Commit: 33e6361 + + Fix jenkins from giving the green light to builds that don't compile. + Michael Armbrust + 2014-04-03 16:53:35 -0700 + Commit: 9231b01, github.com/apache/spark/pull/317 + + [BUILD FIX] Fix compilation of Spark SQL Java API. 
+ Michael Armbrust + 2014-04-03 16:12:08 -0700 + Commit: d94826b, github.com/apache/spark/pull/316 + + [SPARK-1134] Fix and document passing of arguments to IPython + Diana Carroll + 2014-04-03 15:48:42 -0700 + Commit: a599e43, github.com/apache/spark/pull/294 + + [SQL] SPARK-1333 First draft of java API + Michael Armbrust + 2014-04-03 15:45:34 -0700 + Commit: b8f5341, github.com/apache/spark/pull/248 + + Spark 1162 Implemented takeOrdered in pyspark. + Prashant Sharma + 2014-04-03 15:42:17 -0700 + Commit: c1ea3af, github.com/apache/spark/pull/97 + + [SPARK-1360] Add Timestamp Support for SQL + Cheng Hao + 2014-04-03 15:33:17 -0700 + Commit: 5d1feda, github.com/apache/spark/pull/275 + + Spark parquet improvements + Andre Schumacher + 2014-04-03 15:31:47 -0700 + Commit: fbebaed, github.com/apache/spark/pull/195 + + [SPARK-1398] Removed findbugs jsr305 dependency + Mark Hamstra + 2014-04-03 14:08:47 -0700 + Commit: 92a86b2, github.com/apache/spark/pull/307 + + [SQL] SPARK-1364 Improve datatype and test coverage for ScalaReflection schema inference. + Michael Armbrust + 2014-04-02 18:14:31 -0700 + Commit: 47ebea5, github.com/apache/spark/pull/293 + + [SPARK-1212, Part II] Support sparse data in MLlib + Xiangrui Meng + 2014-04-02 14:01:12 -0700 + Commit: 9c65fa7, github.com/apache/spark/pull/245 + + StopAfter / TopK related changes + Reynold Xin , Michael Armbrust + 2014-04-02 12:48:04 -0700 + Commit: ed730c9, github.com/apache/spark/pull/233 + + [SPARK-1371][WIP] Compression support for Spark SQL in-memory columnar storage + Cheng Lian + 2014-04-02 12:47:22 -0700 + Commit: 1faa579, github.com/apache/spark/pull/285 + + Do not re-use objects in the EdgePartition/EdgeTriplet iterators. 
+ Daniel Darabos + 2014-04-02 12:27:37 -0700 + Commit: 7823633, github.com/apache/spark/pull/276 + + [SPARK-1385] Use existing code for JSON de/serialization of BlockId + Andrew Or + 2014-04-02 10:43:09 -0700 + Commit: de8eefa, github.com/apache/spark/pull/289 + + Renamed stageIdToActiveJob to jobIdToActiveJob. + Kay Ousterhout + 2014-04-02 10:35:52 -0700 + Commit: 11973a7, github.com/apache/spark/pull/301 + + Remove * from test case golden filename. + Michael Armbrust + 2014-04-01 23:54:38 -0700 + Commit: ea9de65, github.com/apache/spark/pull/297 + + MLI-1 Decision Trees + Manish Amde , manishamde , Xiangrui Meng + 2014-04-01 21:40:49 -0700 + Commit: 8b3045c, github.com/apache/spark/pull/79 + + Revert "[Spark-1134] only call ipython if no arguments are given; remove IPYTHONOPTS from call" + Matei Zaharia + 2014-04-01 19:31:50 -0700 + Commit: 45df912 + + [Spark-1134] only call ipython if no arguments are given; remove IPYTHONOPTS from call + Diana Carroll + 2014-04-01 19:29:26 -0700 + Commit: afb5ea6, github.com/apache/spark/pull/227 + + [SPARK-1342] Scala 2.10.4 + Mark Hamstra + 2014-04-01 18:35:50 -0700 + Commit: 764353d, github.com/apache/spark/pull/259 + + [SQL] SPARK-1372 Support for caching and uncaching tables in a SQLContext. + Michael Armbrust + 2014-04-01 14:45:44 -0700 + Commit: f5c418d, github.com/apache/spark/pull/282 + + [Hot Fix #42] Persisted RDD disappears on storage page if re-used + Andrew Or + 2014-03-31 23:01:14 -0700 + Commit: ada310a, github.com/apache/spark/pull/281 + + [SPARK-1377] Upgrade Jetty to 8.1.14v20131031 + Andrew Or + 2014-03-31 21:42:36 -0700 + Commit: 94fe7fd, github.com/apache/spark/pull/280 + + SPARK-1376. 
In the yarn-cluster submitter, rename "args" option to "arg" + Sandy Ryza + 2014-04-01 08:26:31 +0530 + Commit: 564f1c1, github.com/apache/spark/pull/279 + + SPARK-1365 [HOTFIX] Fix RateLimitedOutputStream test + Patrick Wendell + 2014-03-31 16:25:43 -0700 + Commit: 33b3c2a, github.com/apache/spark/pull/277 + + [SQL] Rewrite join implementation to allow streaming of one relation. + Michael Armbrust + 2014-03-31 15:23:46 -0700 + Commit: 5731af5, github.com/apache/spark/pull/250 + + SPARK-1352: Improve robustness of spark-submit script + Patrick Wendell + 2014-03-31 12:07:14 -0700 + Commit: 841721e, github.com/apache/spark/pull/271 + + SPARK-1352 - Comment style single space before ending */ check. + Prashant Sharma + 2014-03-30 10:06:56 -0700 + Commit: d666053, github.com/apache/spark/pull/261 + + [SPARK-1354][SQL] Add tableName as a qualifier for SimpleCatelogy + jerryshao + 2014-03-30 10:03:58 -0700 + Commit: 95d7d2a, github.com/apache/spark/pull/272 + + SPARK-1336 Reducing the output of run-tests script. + Prashant Sharma , Prashant Sharma + 2014-03-29 23:03:03 -0700 + Commit: df1b9f7, github.com/apache/spark/pull/262 + + [SQL] SPARK-1354 Fix self-joins of parquet relations + Michael Armbrust + 2014-03-29 22:02:53 -0700 + Commit: 2861b07, github.com/apache/spark/pull/269 + + Don't swallow all kryo errors, only those that indicate we are out of data. + Michael Armbrust + 2014-03-29 22:01:29 -0700 + Commit: 92b8395, github.com/apache/spark/pull/142 + + [SPARK-1186] : Enrich the Spark Shell to support additional arguments. + Bernardo Gomez Palacio + 2014-03-29 19:49:22 -0700 + Commit: fda86d8, github.com/apache/spark/pull/116 + + Implement the RLike & Like in catalyst + Cheng Hao + 2014-03-29 15:12:43 -0700 + Commit: af3746c, github.com/apache/spark/pull/224 + + SPARK-1126. spark-app preliminary + Sandy Ryza + 2014-03-29 14:41:36 -0700 + Commit: 1617816, github.com/apache/spark/pull/86 + + SPARK-1345 adding missing dependency on avro for hadoop 0.23 to the new ... 
+ Thomas Graves + 2014-03-28 23:09:29 -0700 + Commit: 3738f24, github.com/apache/spark/pull/263 + + fix path for jar, make sed actually work on OSX + Nick Lanham + 2014-03-28 13:33:35 -0700 + Commit: 75d46be, github.com/apache/spark/pull/264 + + SPARK-1096, a space after comment start style checker. + Prashant Sharma + 2014-03-28 00:21:49 -0700 + Commit: 60abc25, github.com/apache/spark/pull/124 + + Make sed do -i '' on OSX + Nick Lanham + 2014-03-27 22:45:00 -0700 + Commit: 632c322, github.com/apache/spark/pull/258 + + [SPARK-1210] Prevent ContextClassLoader of Actor from becoming ClassLoader of Executo... + Takuya UESHIN + 2014-03-27 22:17:15 -0700 + Commit: 3d89043, github.com/apache/spark/pull/15 + + [SPARK-1268] Adding XOR and AND-NOT operations to spark.util.collection.BitSet + Petko Nikolov + 2014-03-27 15:49:07 -0700 + Commit: 6f986f0, github.com/apache/spark/pull/172 + + SPARK-1335. Also increase perm gen / code cache for scalatest when invoked via Maven build + Sean Owen + 2014-03-27 11:49:11 -0700 + Commit: 53953d0, github.com/apache/spark/pull/253 + + SPARK-1330 removed extra echo from comput_classpath.sh + Thomas Graves + 2014-03-27 11:54:43 -0500 + Commit: 426042a, github.com/apache/spark/pull/241 + + Cut down the granularity of travis tests. + Michael Armbrust + 2014-03-27 08:53:42 -0700 + Commit: 5b2d863, github.com/apache/spark/pull/255 + + [SPARK-1327] GLM needs to check addIntercept for intercept and weights + Xiangrui Meng + 2014-03-26 19:30:20 -0700 + Commit: d679843, github.com/apache/spark/pull/236 + + SPARK-1325. 
The maven build error for Spark Tools + Sean Owen , witgo + 2014-03-26 18:31:52 -0700 + Commit: 1fa48d9, github.com/apache/spark/pull/240 + + Spark 1095 : Adding explicit return types to all public methods + NirmalReddy , NirmalReddy + 2014-03-26 18:24:55 -0700 + Commit: 3e63d98, github.com/apache/spark/pull/168 + + SPARK-1324: SparkUI Should Not Bind to SPARK_PUBLIC_DNS + Patrick Wendell + 2014-03-26 18:22:15 -0700 + Commit: be6d96c, github.com/apache/spark/pull/231 + + [SQL] Add a custom serializer for maps since they do not have a no-arg constructor. + Michael Armbrust + 2014-03-26 18:19:49 -0700 + Commit: e15e574, github.com/apache/spark/pull/243 + + [SQL] Un-ignore a test that is now passing. + Michael Armbrust + 2014-03-26 18:19:15 -0700 + Commit: 32cbdfd, github.com/apache/spark/pull/244 + + Unified package definition format in Spark SQL + Cheng Lian + 2014-03-26 15:36:18 -0700 + Commit: 345825d, github.com/apache/spark/pull/225 + + SPARK-1322, top in pyspark should sort result in descending order. + Prashant Sharma + 2014-03-26 09:16:37 -0700 + Commit: a0853a3, github.com/apache/spark/pull/235 + + SPARK-1321 Use Guava's top k implementation rather than our BoundedPriorityQueue based implementation + Reynold Xin + 2014-03-26 00:09:44 -0700 + Commit: b859853, github.com/apache/spark/pull/229 + + Initial experimentation with Travis CI configuration + Michael Armbrust + 2014-03-25 19:01:18 -0700 + Commit: 4f7d547, github.com/apache/spark/pull/230 + + Avoid Option while generating call site + witgo , Aaron Davidson + 2014-03-25 13:28:13 -0700 + Commit: 8237df8, github.com/apache/spark/pull/222 + + SPARK-1319: Fix scheduler to account for tasks using > 1 CPUs. + Shivaram Venkataraman + 2014-03-25 13:05:30 -0700 + Commit: f8111ea, github.com/apache/spark/pull/219 + + SPARK-1316. 
Remove use of Commons IO + Sean Owen + 2014-03-25 10:21:25 -0700 + Commit: 71d4ed2, github.com/apache/spark/pull/226 + + Add more hive compatability tests to whitelist + Michael Armbrust + 2014-03-25 09:57:26 -0700 + Commit: 134ace7, github.com/apache/spark/pull/220 + + SPARK-1286: Make usage of spark-env.sh idempotent + Aaron Davidson + 2014-03-24 22:24:21 -0700 + Commit: 007a733, github.com/apache/spark/pull/184 + + Unify the logic for column pruning, projection, and filtering of table scans. + Michael Armbrust + 2014-03-24 22:15:51 -0700 + Commit: b637f2d, github.com/apache/spark/pull/213 + + SPARK-1128: set hadoop task properties when constructing HadoopRDD + CodingCat , Nan Zhu + 2014-03-24 21:55:03 -0700 + Commit: 5140598, github.com/apache/spark/pull/101 + + SPARK-1094 Support MiMa for reporting binary compatibility accross versions. + Patrick Wendell , Prashant Sharma , Prashant Sharma + 2014-03-24 21:20:23 -0700 + Commit: dc126f2, github.com/apache/spark/pull/207 + + SPARK-1294 Fix resolution of uppercase field names using a HiveContext. + Michael Armbrust + 2014-03-24 19:24:22 -0700 + Commit: 8043b7b, github.com/apache/spark/pull/202 + + HOT FIX: Exclude test files from RAT + Patrick Wendell + 2014-03-24 13:38:07 -0700 + Commit: 56db8a2 + + SPARK-1144 Added license and RAT to check licenses. + Prashant Sharma + 2014-03-24 08:44:12 -0700 + Commit: 21109fb, github.com/apache/spark/pull/125 + + [SPARK-1212] Adding sparse data support and update KMeans + Xiangrui Meng + 2014-03-23 17:34:02 -0700 + Commit: 80c2968, github.com/apache/spark/pull/117 + + Fixed coding style issues in Spark SQL + Cheng Lian + 2014-03-23 15:21:40 -0700 + Commit: 8265dc7, github.com/apache/spark/pull/208 + + [SPARK-1292] In-memory columnar representation for Spark SQL + Cheng Lian , Cheng Lian + 2014-03-23 12:08:55 -0700 + Commit: 57a4379, github.com/apache/spark/pull/205 + + SPARK-1254. 
Supplemental fix for HTTPS on Maven Central + Sean Owen + 2014-03-23 10:57:01 -0700 + Commit: abf6714, github.com/apache/spark/pull/209 + + Fix to Stage UI to display numbers on progress bar + Emtiaz Ahmed + 2014-03-21 18:05:53 -0700 + Commit: 646e554, github.com/apache/spark/pull/201 + + Add asCode function for dumping raw tree representations. + Michael Armbrust + 2014-03-21 16:54:06 -0700 + Commit: d780983, github.com/apache/spark/pull/200 + + Make SQL keywords case-insensitive + Matei Zaharia + 2014-03-21 16:53:18 -0700 + Commit: dab5439, github.com/apache/spark/pull/193 + + SPARK-1279: Fix improper use of SimpleDateFormat + zsxwing + 2014-03-21 16:07:22 -0700 + Commit: 2c0aa22, github.com/apache/spark/pull/179 + + Add hive test files to repository. Remove download script. + Michael Armbrust + 2014-03-21 15:05:45 -0700 + Commit: 7e17fe6, github.com/apache/spark/pull/199 + + Fix maven jenkins: Add explicit init for required tables in SQLQuerySuite + Michael Armbrust + 2014-03-20 22:31:11 -0700 + Commit: e09139d, github.com/apache/spark/pull/191 + + SPARK-1251 Support for optimizing and executing structured queries + Michael Armbrust , Yin Huai , Reynold Xin , Lian, Cheng , Andre Schumacher , Yin Huai , Timothy Chen , Cheng Lian , Timothy Chen , Henry Cook , Mark Hamstra + 2014-03-20 18:03:20 -0700 + Commit: 9aadcff, github.com/apache/spark/pull/146 + + [Hot Fix #42] Do not stop SparkUI if bind() is not called + Andrew Or + 2014-03-20 14:13:16 -0700 + Commit: ca76423, github.com/apache/spark/pull/188 + + Principal Component Analysis + Reza Zadeh + 2014-03-20 10:39:20 -0700 + Commit: 66a03e5, github.com/apache/spark/pull/88 + + Revert "SPARK-1099:Spark's local mode should probably respect spark.cores.max by default" + Aaron Davidson + 2014-03-19 17:56:48 -0700 + Commit: ffe272d + + SPARK-1099:Spark's local mode should probably respect spark.cores.max by default + qqsun8819 + 2014-03-19 16:33:54 -0700 + Commit: 1678931, github.com/apache/spark/pull/110 + + Added 
doctest for map function in rdd.py + Jyotiska NK + 2014-03-19 14:04:45 -0700 + Commit: 67fa71c, github.com/apache/spark/pull/177 + + [SPARK-1132] Persisting Web UI through refactoring the SparkListener interface + Andrew Or , andrewor14 + 2014-03-19 13:17:01 -0700 + Commit: 79d07d6, github.com/apache/spark/pull/42 + + Bugfixes/improvements to scheduler + Mridul Muralidharan + 2014-03-19 12:46:55 -0700 + Commit: ab747d3, github.com/apache/spark/pull/159 + + SPARK-1203 fix saving to hdfs from yarn + Thomas Graves + 2014-03-19 08:09:20 -0500 + Commit: 6112270, github.com/apache/spark/pull/173 + + bugfix: Wrong "Duration" in "Active Stages" in stages page + shiyun.wxm + 2014-03-19 01:42:34 -0700 + Commit: d55ec86, github.com/apache/spark/pull/170 + + Bundle tachyon: SPARK-1269 + Nick Lanham + 2014-03-18 22:04:57 -0700 + Commit: a18ea00, github.com/apache/spark/pull/137 + + Fix SPARK-1256: Master web UI and Worker web UI returns a 404 error + witgo + 2014-03-18 21:57:47 -0700 + Commit: cc2655a, github.com/apache/spark/pull/150 + + [SPARK-1266] persist factors in implicit ALS + Xiangrui Meng + 2014-03-18 17:20:42 -0700 + Commit: f9d8a83, github.com/apache/spark/pull/165 + + [SPARK-1260]: faster construction of features with intercept + Xiangrui Meng + 2014-03-18 15:14:13 -0700 + Commit: e108b9a, github.com/apache/spark/pull/161 + + Update copyright year in NOTICE to 2014 + Matei Zaharia + 2014-03-18 14:34:31 -0700 + Commit: 79e547f, github.com/apache/spark/pull/174 + + SPARK-1102: Create a saveAsNewAPIHadoopDataset method + CodingCat + 2014-03-18 11:06:18 -0700 + Commit: 2fa26ec, github.com/apache/spark/pull/12 + + Revert "SPARK-1236 - Upgrade Jetty to 9.1.3.v20140225." 
+ Patrick Wendell + 2014-03-18 00:46:03 -0700 + Commit: e7423d4, github.com/apache/spark/pull/167 + + Spark 1246 add min max to stat counter + Dan McClary + 2014-03-18 00:45:47 -0700 + Commit: e3681f2, github.com/apache/spark/pull/144 + + [Spark-1261] add instructions for running python examples to doc overview page + Diana Carroll + 2014-03-17 17:35:51 -0700 + Commit: 087eedc, github.com/apache/spark/pull/162 + + SPARK-1244: Throw exception if map output status exceeds frame size + Patrick Wendell , Andrew Or + 2014-03-17 14:03:32 -0700 + Commit: 796977a, github.com/apache/spark/pull/152 + + SPARK-1240: handle the case of empty RDD when takeSample + CodingCat + 2014-03-16 22:14:59 -0700 + Commit: dc96546, github.com/apache/spark/pull/135 + + SPARK-1255: Allow user to pass Serializer object instead of class name for shuffle. + Reynold Xin + 2014-03-16 09:57:21 -0700 + Commit: f5486e9, github.com/apache/spark/pull/149 + + SPARK-1254. Consolidate, order, and harmonize repository declarations in Maven/SBT builds + Sean Owen + 2014-03-15 16:43:27 -0700 + Commit: 97e4459, github.com/apache/spark/pull/145 + + Fix serialization of MutablePair. Also provide an interface for easy updating. + Michael Armbrust + 2014-03-14 11:40:26 -0700 + Commit: e19044c, github.com/apache/spark/pull/141 + + [bugfix] wrong client arg, should use executor-cores + Tianshuo Deng + 2014-03-13 20:27:36 -0700 + Commit: 181b130, github.com/apache/spark/pull/138 + + SPARK-1236 - Upgrade Jetty to 9.1.3.v20140225. + Reynold Xin + 2014-03-13 12:16:04 -0700 + Commit: ca4bf8c, github.com/apache/spark/pull/113 + + SPARK-1183. 
Don't use "worker" to mean executor + Sandy Ryza + 2014-03-13 12:11:33 -0700 + Commit: 6983732, github.com/apache/spark/pull/120 + + [SPARK-1237, 1238] Improve the computation of YtY for implicit ALS + Xiangrui Meng + 2014-03-13 00:43:19 -0700 + Commit: e4e8d8f, github.com/apache/spark/pull/131 + + SPARK-1019: pyspark RDD take() throws an NPE + Patrick Wendell + 2014-03-12 23:16:59 -0700 + Commit: 4ea23db, github.com/apache/spark/pull/112 + + hot fix for PR105 - change to Java annotation + CodingCat + 2014-03-12 19:49:18 -0700 + Commit: 6bd2eaa, github.com/apache/spark/pull/133 + + Fix example bug: compile error + jianghan + 2014-03-12 19:46:12 -0700 + Commit: 31a7040, github.com/apache/spark/pull/132 + + SPARK-1160: Deprecate toArray in RDD + CodingCat + 2014-03-12 17:43:12 -0700 + Commit: 9032f7c, github.com/apache/spark/pull/105 + + SPARK-1162 Added top in python. + Prashant Sharma + 2014-03-12 15:57:44 -0700 + Commit: b8afe30, github.com/apache/spark/pull/93 + + Fix #SPARK-1149 Bad partitioners can cause Spark to hang + liguoqiang + 2014-03-12 12:59:51 -0700 + Commit: 5d1ec64, github.com/apache/spark/pull/44 + + [SPARK-1233] Fix running hadoop 0.23 due to java.lang.NoSuchFieldException: DEFAULT_M... + Thomas Graves + 2014-03-12 11:25:41 -0700 + Commit: b5162f4, github.com/apache/spark/pull/129 + + [SPARK-1232] Fix the hadoop 0.23 yarn build + Thomas Graves + 2014-03-12 10:32:01 -0700 + Commit: c8c59b3, github.com/apache/spark/pull/127 + + Spark-1163, Added missing Python RDD functions + prabinb + 2014-03-11 23:57:05 -0700 + Commit: af7f2f1, github.com/apache/spark/pull/92 + + SPARK-1064 + Sandy Ryza + 2014-03-11 22:39:17 -0700 + Commit: 2409af9, github.com/apache/spark/pull/102 + + SPARK-1167: Remove metrics-ganglia from default build due to LGPL issues... + Patrick Wendell + 2014-03-11 11:16:59 -0700 + Commit: 16788a6, github.com/apache/spark/pull/108 + + SPARK-1211. In ApplicationMaster, set spark.master system property to "y... 
+ Sandy Ryza + 2014-03-10 17:42:33 -0700 + Commit: 2a2c964, github.com/apache/spark/pull/118 + + SPARK-1205: Clean up callSite/origin/generator. + Patrick Wendell + 2014-03-10 16:28:41 -0700 + Commit: 2a51617, github.com/apache/spark/pull/106 + + SPARK-1168, Added foldByKey to pyspark. + Prashant Sharma + 2014-03-10 13:37:11 -0700 + Commit: a59419c, github.com/apache/spark/pull/115 + + [SPARK-972] Added detailed callsite info for ValueError in context.py (resubmitted) + jyotiska + 2014-03-10 13:34:49 -0700 + Commit: f551898, github.com/apache/spark/pull/34 + + SPARK-977 Added Python RDD.zip function + Prabin Banka + 2014-03-10 13:27:00 -0700 + Commit: e1e09e0, github.com/apache/spark/pull/76 + + maintain arbitrary state data for each key + Chen Chao + 2014-03-09 22:42:12 -0700 + Commit: 5d98cfc, github.com/apache/spark/pull/114 + + SPARK-782 Clean up for ASM dependency. + Patrick Wendell + 2014-03-09 13:17:07 -0700 + Commit: b9be160, github.com/apache/spark/pull/100 + + Fix markup errors introduced in #33 (SPARK-1189) + Patrick Wendell + 2014-03-09 11:57:06 -0700 + Commit: faf4cad, github.com/apache/spark/pull/111 + + Add timeout for fetch file + Jiacheng Guo + 2014-03-09 11:37:44 -0700 + Commit: f6f9d02, github.com/apache/spark/pull/98 + + SPARK-929: Fully deprecate usage of SPARK_MEM + Aaron Davidson + 2014-03-09 11:08:39 -0700 + Commit: 52834d7, github.com/apache/spark/pull/99 + + SPARK-1190: Do not initialize log4j if slf4j log4j backend is not being used + Patrick Wendell + 2014-03-08 16:02:42 -0800 + Commit: e59a3b6, github.com/apache/spark/pull/107 + + Update junitxml plugin to the latest version to avoid recompilation in every SBT command. + Reynold Xin + 2014-03-08 12:40:26 -0800 + Commit: c2834ec, github.com/apache/spark/pull/104 + + [SPARK-1194] Fix the same-RDD rule for cache replacement + Cheng Lian + 2014-03-07 23:26:46 -0800 + Commit: 0b7b7fd, github.com/apache/spark/pull/96 + + Allow sbt to use more than 1G of heap. 
+ Reynold Xin + 2014-03-07 23:23:59 -0800 + Commit: 8ad486a, github.com/apache/spark/pull/103 + + SPARK-1193. Fix indentation in pom.xmls + Sandy Ryza + 2014-03-07 23:10:35 -0800 + Commit: a99fb37, github.com/apache/spark/pull/91 + + Spark 1165 rdd.intersection in python and java + Prashant Sharma , Prashant Sharma + 2014-03-07 18:48:07 -0800 + Commit: 6e730ed, github.com/apache/spark/pull/80 + + SPARK-1195: set map_input_file environment variable in PipedRDD + Thomas Graves + 2014-03-07 10:36:55 -0800 + Commit: b7cd9e9, github.com/apache/spark/pull/94 + + SPARK-1136: Fix FaultToleranceTest for Docker 0.8.1 + Aaron Davidson + 2014-03-07 10:22:27 -0800 + Commit: dabeb6f, github.com/apache/spark/pull/5 + + Small clean-up to flatmap tests + Patrick Wendell + 2014-03-06 17:57:31 -0800 + Commit: 33baf14 + + Example for cassandra CQL read/write from spark + anitatailor + 2014-03-06 17:46:43 -0800 + Commit: 9ae919c, github.com/apache/spark/pull/87 + + SPARK-1197. Change yarn-standalone to yarn-cluster and fix up running on YARN docs + Sandy Ryza + 2014-03-06 17:12:58 -0800 + Commit: 328c73d, github.com/apache/spark/pull/95 + + SPARK-1189: Add Security to Spark - Akka, Http, ConnectionManager, UI use servlets + Thomas Graves + 2014-03-06 18:27:50 -0600 + Commit: 7edbea4, github.com/apache/spark/pull/33 + + SPARK-942: Do not materialize partitions when DISK_ONLY storage level is used + Kyle Ellrott + 2014-03-06 14:51:00 -0800 + Commit: 40566e1, github.com/apache/spark/pull/50 + + SPARK-1187, Added missing Python APIs + Prabin Banka + 2014-03-06 12:45:27 -0800 + Commit: 3d3acef, github.com/apache/spark/pull/75 + + SPARK-1156: allow user to login into a cluster without slaves + CodingCat + 2014-03-05 21:47:34 -0800 + Commit: 3eb009f, github.com/apache/spark/pull/58 + + SPARK-1184: Update the distribution tar.gz to include spark-assembly jar + Mark Grover + 2014-03-05 16:52:58 -0800 + Commit: cda381f, github.com/apache/spark/pull/78 + + Improve building with maven docs + 
liguoqiang + 2014-03-05 16:38:43 -0800 + Commit: 51ca7bd, github.com/apache/spark/pull/70 + + SPARK-1171: when executor is removed, we should minus totalCores instead of just freeCores on that executor + CodingCat , Nan Zhu + 2014-03-05 14:00:28 -0800 + Commit: a3da508, github.com/apache/spark/pull/63 + + SPARK-1109 wrong API docs for pyspark map function + Prashant Sharma + 2014-03-04 15:32:43 -0800 + Commit: 0283665, github.com/apache/spark/pull/73 + + SPARK-1178: missing document of spark.scheduler.revive.interval + CodingCat + 2014-03-04 10:28:17 -0800 + Commit: 1865dd6, github.com/apache/spark/pull/74 + + SPARK-1164 Deprecated reduceByKeyToDriver as it is an alias for reduceByKeyLocally + Prashant Sharma + 2014-03-04 10:27:02 -0800 + Commit: 2d8e0a0, github.com/apache/spark/pull/72 + + [java8API] SPARK-964 Investigate the potential for using JDK 8 lambda expressions for the Java/Scala APIs + Prashant Sharma , Patrick Wendell + 2014-03-03 22:31:30 -0800 + Commit: 181ec50, github.com/apache/spark/pull/17 + + Remove broken/unused Connection.getChunkFIFO method. + Kay Ousterhout + 2014-03-03 21:27:18 -0800 + Commit: b14ede7, github.com/apache/spark/pull/69 + + SPARK-1158: Fix flaky RateLimitedOutputStreamSuite. + Reynold Xin + 2014-03-03 21:24:19 -0800 + Commit: f5ae38a, github.com/apache/spark/pull/55 + + Added a unit test for PairRDDFunctions.lookup + Bryn Keller + 2014-03-03 16:38:57 -0800 + Commit: 923dba5, github.com/apache/spark/pull/36 + + Remove the remoteFetchTime metric. + Kay Ousterhout + 2014-03-03 16:12:00 -0800 + Commit: b55cade, github.com/apache/spark/pull/62 + + update proportion of memory + Chen Chao + 2014-03-03 14:41:25 -0800 + Commit: 9d225a9, github.com/apache/spark/pull/66 + + Removed accidentally checked in comment + Kay Ousterhout + 2014-03-03 14:39:49 -0800 + Commit: 369aad6, github.com/apache/spark/pull/61 + + SPARK-1173. (#2) Fix typo in Java streaming example. 
+ Aaron Kimball + 2014-03-02 23:48:48 -0800 + Commit: f65c1f3, github.com/apache/spark/pull/65 + + SPARK-1173. Improve scala streaming docs. + Aaron Kimball + 2014-03-02 23:26:47 -0800 + Commit: 2b53447, github.com/apache/spark/pull/64 + + Add Jekyll tag to isolate "production-only" doc components. + Patrick Wendell + 2014-03-02 18:19:01 -0800 + Commit: 55a4f11, github.com/apache/spark/pull/56 + + SPARK-1121: Include avro for yarn-alpha builds + Patrick Wendell + 2014-03-02 15:18:19 -0800 + Commit: c3f5e07, github.com/apache/spark/pull/49 + + SPARK-1084.2 (resubmitted) + Sean Owen + 2014-03-02 14:27:53 -0800 + Commit: fd31adb, github.com/apache/spark/pull/32 + + Ignore RateLimitedOutputStreamSuite for now. + Reynold Xin + 2014-03-02 14:27:19 -0800 + Commit: 353ac6b, github.com/apache/spark/pull/54 + + SPARK-1137: Make ZK PersistenceEngine not crash for wrong serialVersionUID + Aaron Davidson + 2014-03-02 01:00:42 -0800 + Commit: 46bcb95, github.com/apache/spark/pull/4 + + Remove remaining references to incubation + Patrick Wendell + 2014-03-02 01:00:16 -0800 + Commit: 1fd2bfd, github.com/apache/spark/pull/51 + + Update io.netty from 4.0.13 Final to 4.0.17.Final + Binh Nguyen , Binh Nguyen + 2014-03-02 00:48:50 -0800 + Commit: b70823c, github.com/apache/spark/pull/41 + + Merge the old sbt-launch-lib.bash with the new sbt-launcher jar downloading logic. 
+ Michael Armbrust + 2014-03-02 00:35:23 -0800 + Commit: 012bd5f, github.com/apache/spark/pull/14 + + Initialized the regVal for first iteration in SGD optimizer + DB Tsai + 2014-03-02 00:31:59 -0800 + Commit: 6fc76e4, github.com/apache/spark/pull/40 + + [SPARK-1100] prevent Spark from overwriting directory silently + CodingCat + 2014-03-01 17:27:54 -0800 + Commit: 3a8b698, github.com/apache/spark/pull/11 + + [SPARK-1150] fix repo location in create script (re-open) + CodingCat + 2014-03-01 17:24:53 -0800 + Commit: fe195ae, github.com/apache/spark/pull/52 + + Revert "[SPARK-1150] fix repo location in create script" + Patrick Wendell + 2014-03-01 17:15:38 -0800 + Commit: ec992e1 + + [SPARK-1150] fix repo location in create script + Mark Grover + 2014-03-01 16:21:22 -0800 + Commit: 9aa0957, github.com/apache/spark/pull/48 + + [SPARK-979] Randomize order of offers. + Kay Ousterhout + 2014-03-01 11:24:22 -0800 + Commit: 556c566, github.com/apache/spark/pull/27 + + SPARK-1151: Update dev merge script to use spark.git instead of incubator-spark + Thomas Graves + 2014-02-28 18:28:33 -0800 + Commit: 4ba3f70, github.com/apache/spark/pull/47 + + SPARK-1051. On YARN, executors don't doAs submitting user + Sandy Ryza + 2014-02-28 12:43:01 -0600 + Commit: 46dff34, github.com/apache/spark/pull/29 + + SPARK-1032. If Yarn app fails before registering, app master stays aroun... + Sandy Ryza + 2014-02-28 09:40:47 -0600 + Commit: 5f419bf, github.com/apache/spark/pull/28 + + Remote BlockFetchTracker trait + Kay Ousterhout + 2014-02-27 21:52:55 -0800 + Commit: edf8a56, github.com/apache/spark/pull/39 + + Removed reference to incubation in Spark user docs. + Reynold Xin + 2014-02-27 21:13:22 -0800 + Commit: 40e080a, github.com/apache/spark/pull/2 + + [HOTFIX] Patching maven build after #6 (SPARK-1121). 
+ Patrick Wendell + 2014-02-27 15:06:20 -0800 + Commit: c42557b, github.com/apache/spark/pull/37 + + SPARK 1084.1 (resubmitted) + Sean Owen + 2014-02-27 11:12:21 -0800 + Commit: 12bbca2, github.com/apache/spark/pull/31 + + Show Master status on UI page + Raymond Liu + 2014-02-26 23:51:32 -0800 + Commit: aace2c0, github.com/apache/spark/pull/24 + + [SPARK-1089] fix the regression problem on ADD_JARS in 0.9 + CodingCat + 2014-02-26 23:42:15 -0800 + Commit: 345df5f, github.com/apache/spark/pull/13 + + SPARK-1121 Only add avro if the build is for Hadoop 0.23.X and SPARK_YARN is set + Prashant Sharma + 2014-02-26 23:40:49 -0800 + Commit: 6ccd6c5, github.com/apache/spark/pull/6 + + SPARK-1129: use a predefined seed when seed is zero in XORShiftRandom + Xiangrui Meng + 2014-02-26 23:22:30 -0800 + Commit: 5a3ad10, github.com/apache/spark/pull/645 + + Remove references to ClusterScheduler (SPARK-1140) + Kay Ousterhout + 2014-02-26 22:52:42 -0800 + Commit: 71f69d6, github.com/apache/spark/pull/9 + + Updated link for pyspark examples in docs + Jyotiska NK + 2014-02-26 21:37:04 -0800 + Commit: 2645035, github.com/apache/spark/pull/22 + + Deprecated and added a few java api methods for corresponding scala api. + Prashant Sharma + 2014-02-26 21:17:44 -0800 + Commit: 0e40e2b, github.com/apache/spark/pull/19 + + Removed reference to incubation in README.md. + Reynold Xin + 2014-02-26 16:52:26 -0800 + Commit: 84f7ca1, github.com/apache/spark/pull/1 + + SPARK-1115: Catch depickling errors + Bouke van der Bijl + 2014-02-26 14:50:37 -0800 + Commit: 12738c1, github.com/apache/spark/pull/644 + + SPARK-1135: fix broken anchors in docs + Matei Zaharia + 2014-02-26 11:20:16 -0800 + Commit: c86eec5, github.com/apache/spark/pull/3 + + SPARK-1078: Replace lift-json with json4s-jackson. + William Benton + 2014-02-26 10:09:50 -0800 + Commit: fbedc8e, github.com/apache/spark/pull/582 + + SPARK-1053. 
Don't require SPARK_YARN_APP_JAR + Sandy Ryza + 2014-02-26 10:00:02 -0600 + Commit: b8a1871, github.com/apache/spark/pull/553 + + For SPARK-1082, Use Curator for ZK interaction in standalone cluster + Raymond Liu + 2014-02-24 23:20:38 -0800 + Commit: c852201, github.com/apache/incubator-spark/pull/611 + + Graph primitives2 + Semih Salihoglu + 2014-02-24 22:42:30 -0800 + Commit: 1f4c7f7, github.com/apache/incubator-spark/pull/580 + + Include reference to twitter/chill in tuning docs + Andrew Ash + 2014-02-24 21:13:38 -0800 + Commit: a4f4fbc, github.com/apache/incubator-spark/pull/647 + + For outputformats that are Configurable, call setConf before sending data to them. + Bryn Keller + 2014-02-24 17:35:22 -0800 + Commit: 4d88030, github.com/apache/incubator-spark/pull/638 + + d8d190e 2014-02-24 16:58:57 -0800 + Merge pull request #641 from mateiz/spark-1124-master + [SPARK-1124: Fix infinite retries of reduce stage when a map stage failed] + + Fix removal from shuffleToMapStage to search for a key-value pair with our stage instead of using our shuffleID. 
+ Matei Zaharia + 2014-02-24 13:14:56 -0800 + Commit: 0187cef + + SPARK-1124: Fix infinite retries of reduce stage when a map stage failed + Matei Zaharia + 2014-02-23 23:45:48 -0800 + Commit: cd32d5e + + SPARK-1071: Tidy logging strategy and use of log4j + Sean Owen + 2014-02-23 11:40:55 -0800 + Commit: c0ef3af, github.com/apache/incubator-spark/pull/570 + + [SPARK-1041] remove dead code in start script, remind user to set that in spark-env.sh + CodingCat + 2014-02-22 20:21:15 -0800 + Commit: 437b62f, github.com/apache/incubator-spark/pull/588 + + Migrate Java code to Scala or move it to src/main/java + Punya Biswal + 2014-02-22 17:53:48 -0800 + Commit: 29ac7ea, github.com/apache/incubator-spark/pull/605 + + [SPARK-1055] fix the SCALA_VERSION and SPARK_VERSION in docker file + CodingCat , Nan Zhu + 2014-02-22 15:39:25 -0800 + Commit: 1aa4f8a, github.com/apache/incubator-spark/pull/634 + + doctest updated for mapValues, flatMapValues in rdd.py + jyotiska + 2014-02-22 15:10:31 -0800 + Commit: 722199f, github.com/apache/incubator-spark/pull/621 + + Fixed minor typo in worker.py + jyotiska + 2014-02-22 10:09:50 -0800 + Commit: 3ff077d, github.com/apache/incubator-spark/pull/630 + + SPARK-1117: update accumulator docs + Xiangrui Meng + 2014-02-21 22:44:45 -0800 + Commit: aaec7d4, github.com/apache/incubator-spark/pull/631 + + [SPARK-1113] External spilling - fix Int.MaxValue hash code collision bug + Andrew Or + 2014-02-21 20:05:39 -0800 + Commit: fefd22f, github.com/apache/incubator-spark/pull/624 + + MLLIB-25: Implicit ALS runs out of memory for moderately large numbers of features + Sean Owen + 2014-02-21 12:46:12 -0800 + Commit: c8a4c9b, github.com/apache/incubator-spark/pull/629 + + SPARK-1111: URL Validation Throws Error for HDFS URL's + Patrick Wendell + 2014-02-21 11:11:55 -0800 + Commit: 45b15e2, github.com/apache/incubator-spark/pull/625 + + SPARK-1114: Allow PySpark to use existing JVM and Gateway + Ahir Reddy + 2014-02-20 21:20:39 -0800 + Commit: 59b1379, 
github.com/apache/incubator-spark/pull/622 + + Super minor: Add require for mergeCombiners in combineByKey + Aaron Davidson + 2014-02-20 16:46:13 -0800 + Commit: 3fede48, github.com/apache/incubator-spark/pull/623 + + MLLIB-22. Support negative implicit input in ALS + Sean Owen + 2014-02-19 23:44:53 -0800 + Commit: 9e63f80, github.com/apache/incubator-spark/pull/500 + + MLLIB-24: url of "Collaborative Filtering for Implicit Feedback Datasets" in ALS is invalid now + Chen Chao + 2014-02-19 22:06:35 -0800 + Commit: f9b7d64, github.com/apache/incubator-spark/pull/619 + + [SPARK-1105] fix site scala version error in docs + CodingCat + 2014-02-19 15:54:03 -0800 + Commit: 7b012c9, github.com/apache/incubator-spark/pull/618 + + SPARK-1106: check key name and identity file before launch a cluster + Xiangrui Meng + 2014-02-18 18:30:02 -0800 + Commit: b61435c, github.com/apache/incubator-spark/pull/617 + + Revert "[SPARK-1105] fix site scala version error in doc" + Patrick Wendell + 2014-02-18 17:46:47 -0800 + Commit: d9bb32a + + [SPARK-1105] fix site scala version error in doc + CodingCat + 2014-02-18 16:29:23 -0800 + Commit: d99773d, github.com/apache/incubator-spark/pull/616 + + Optimized imports + NirmalReddy , NirmalReddy + 2014-02-18 14:44:36 -0800 + Commit: ccb327a, github.com/apache/incubator-spark/pull/613 + + SPARK-1098: Minor cleanup of ClassTag usage in Java API + Aaron Davidson + 2014-02-17 19:23:27 -0800 + Commit: f74ae0e, github.com/apache/incubator-spark/pull/604 + + [SPARK-1090] improvement on spark_shell (help information, configure memory) + CodingCat + 2014-02-17 15:12:52 -0800 + Commit: e0d49ad, github.com/apache/incubator-spark/pull/599 + + Fix typos in Spark Streaming programming guide + Andrew Or + 2014-02-17 10:59:02 -0800 + Commit: 767e3ae, github.com/apache/incubator-spark/pull/536 + + Worker registration logging fix + Andrew Ash + 2014-02-17 09:51:55 -0800 + Commit: c0795cf, github.com/apache/incubator-spark/pull/608 + + Add subtractByKey to the 
JavaPairRDD wrapper + Punya Biswal + 2014-02-16 18:55:59 -0800 + Commit: 5af4477, github.com/apache/incubator-spark/pull/600 + + fix for https://spark-project.atlassian.net/browse/SPARK-1052 + Bijay Bisht + 2014-02-16 16:52:57 -0800 + Commit: 73cfdcf, github.com/apache/incubator-spark/pull/568 + + [SPARK-1092] print warning information if user use SPARK_MEM to regulate executor memory usage + CodingCat + 2014-02-16 12:25:38 -0800 + Commit: 1cad381, github.com/apache/incubator-spark/pull/602 + + Typo: Standlone -> Standalone + Andrew Ash + 2014-02-14 10:01:01 -0800 + Commit: eec4bd1, github.com/apache/incubator-spark/pull/601 + + 2414ed3 2014-02-13 14:26:06 -0800 + Merge pull request #598 from shivaram/master. + [Update spark_ec2 to use 0.9.0 by default] + + Add c3 instance types to Spark EC2 + Christian Lundgren + 2014-02-13 12:44:21 -0800 + Commit: 5fa53c0, github.com/apache/incubator-spark/pull/595 + + Ported hadoopClient jar for < 1.0.1 fix + Bijay Bisht + 2014-02-12 23:42:10 -0800 + Commit: a3bb861, github.com/apache/incubator-spark/pull/584 + + SPARK-1073 Keep GitHub pull request title as commit summary + Andrew Ash + 2014-02-12 23:23:06 -0800 + Commit: 6ee0ad8, github.com/apache/incubator-spark/pull/574 + + 7fe7a55 2014-02-12 22:35:09 -0800 + Merge pull request #592 from rxin/test. + [SPARK-1088: Create a script for running tests so we can have version specific testing on Jenkins.] + + 7e29e02 2014-02-12 16:26:25 -0800 + Merge pull request #591 from mengxr/transient-new. + [SPARK-1076: [Fix #578] add @transient to some vals] + + 2bea070 2014-02-12 10:47:52 -0800 + Merge pull request #589 from mengxr/index. + [SPARK-1076: Convert Int to Long to avoid overflow] + + e733d65 2014-02-12 00:42:42 -0800 + Merge pull request #578 from mengxr/rank. + [SPARK-1076: zipWithIndex and zipWithUniqueId to RDD] + + 68b2c0d 2014-02-11 22:39:48 -0800 + Merge pull request #583 from colorant/zookeeper. 
+ [Minor fix for ZooKeeperPersistenceEngine to use configured working dir] + + b0dab1b 2014-02-11 14:48:59 -0800 + Merge pull request #571 from holdenk/switchtobinarysearch. + [SPARK-1072 Use binary search when needed in RangePartioner] + + ba38d98 2014-02-11 14:46:22 -0800 + Merge pull request #577 from hsaputra/fix_simple_streaming_doc. + [SPARK-1075 Fix doc in the Spark Streaming custom receiver closing bracket in the class constructor] + + 4afe6cc 2014-02-10 22:28:39 -0800 + Merge pull request #579 from CrazyJvm/patch-1. + ["in the source DStream" rather than "int the source DStream"] + + d6a9bdc 2014-02-09 23:35:06 -0800 + Revert "Merge pull request #560 from pwendell/logging. Closes #560." + [This reverts commit b6d40b782327188a25ded5b22790552121e5271f.] + + 919bd7f 2014-02-09 22:17:52 -0800 + Merge pull request #567 from ScrapCodes/style2. + [SPARK-1058, Fix Style Errors and Add Scala Style to Spark Build. Pt 2] + + 2182aa3 2014-02-09 15:19:50 -0800 + Merge pull request #566 from martinjaggi/copy-MLlib-d. + [new MLlib documentation for optimization, regression and classification] + + afc8f3c 2014-02-09 13:57:29 -0800 + Merge pull request #551 from qqsun8819/json-protocol. + [[SPARK-1038] Add more fields in JsonProtocol and add tests that verify the JSON itself] + + 94ccf86 2014-02-09 13:54:27 -0800 + Merge pull request #569 from pwendell/merge-fixes. + [Fixes bug where merges won't close associated pull request.] + + b69f8b2 2014-02-09 10:09:19 -0800 + Merge pull request #557 from ScrapCodes/style. Closes #557. + [SPARK-1058, Fix Style Errors and Add Scala Style to Spark Build.] + + b6dba10 2014-02-08 23:39:17 -0800 + Merge pull request #556 from CodingCat/JettyUtil. Closes #556. + [[SPARK-1060] startJettyServer should explicitly use IP information] + + 2ef37c9 2014-02-08 23:36:48 -0800 + Merge pull request #562 from jyotiska/master. Closes #562. 
+ [Added example Python code for sort] + + b6d40b7 2014-02-08 23:35:31 -0800 + Merge pull request #560 from pwendell/logging. Closes #560. + [[WIP] SPARK-1067: Default log4j initialization causes errors for those not using log4j] + + f892da8 2014-02-08 23:13:34 -0800 + Merge pull request #565 from pwendell/dev-scripts. Closes #565. + [SPARK-1066: Add developer scripts to repository.] + + c2341c9 2014-02-08 16:00:43 -0800 + Merge pull request #542 from markhamstra/versionBump. Closes #542. + [Version number to 1.0.0-SNAPSHOT] + + f0ce736 2014-02-08 12:59:48 -0800 + Merge pull request #561 from Qiuzhuang/master. Closes #561. + [Kill drivers in postStop() for Worker.] + + 7805080 2014-02-08 12:24:08 -0800 + Merge pull request #454 from jey/atomic-sbt-download. Closes #454. + [Make sbt download an atomic operation] + + fabf174 2014-02-08 11:39:13 -0800 + Merge pull request #552 from martinjaggi/master. Closes #552. + [tex formulas in the documentation] + + 3a9d82c 2014-02-06 22:38:36 -0800 + Merge pull request #506 from ash211/intersection. Closes #506. + [SPARK-1062 Add rdd.intersection(otherRdd) method] + + 1896c6e 2014-02-06 22:05:53 -0800 + Merge pull request #533 from andrewor14/master. Closes #533. + [External spilling - generalize batching logic] + + 0b448df 2014-02-06 16:15:24 -0800 + Merge pull request #450 from kayousterhout/fetch_failures. Closes #450. + [Only run ResubmitFailedStages event after a fetch fails] + + 18ad59e 2014-02-06 16:10:48 -0800 + Merge pull request #321 from kayousterhout/ui_kill_fix. Closes #321. + [Inform DAG scheduler about all started/finished tasks.] + + 446403b 2014-02-06 15:41:16 -0800 + Merge pull request #554 from sryza/sandy-spark-1056. Closes #554. + [SPARK-1056. Fix header comment in Executor to not imply that it's only u...] + + 084839b 2014-02-06 14:58:35 -0800 + Merge pull request #498 from ScrapCodes/python-api. Closes #498. 
+ [Python api additions] + + 79c9552 2014-02-05 23:38:12 -0800 + Merge pull request #545 from kayousterhout/fix_progress. Closes #545. + [Fix off-by-one error with task progress info log.] + + 3802096 2014-02-05 23:37:07 -0800 + Merge pull request #526 from tgravescs/yarn_client_stop_am_fix. Closes #526. + [spark on yarn - yarn-client mode doesn't always exit immediately] + + 18c4ee7 2014-02-05 22:08:47 -0800 + Merge pull request #549 from CodingCat/deadcode_master. Closes #549. + [remove actorToWorker in master.scala, which is actually not used] + + cc14ba9 2014-02-05 12:44:24 -0800 + Merge pull request #544 from kayousterhout/fix_test_warnings. Closes #544. + [Fixed warnings in test compilation.] + + f7fd80d 2014-02-05 10:29:45 -0800 + Merge pull request #540 from sslavic/patch-3. Closes #540. + [Fix line end character stripping for Windows] + + 9209287 2014-02-04 09:47:11 -0800 + Merge pull request #534 from sslavic/patch-1. Closes #534. + [Fixed wrong path to compute-classpath.cmd] + + 0c05cd3 2014-02-04 09:45:46 -0800 + Merge pull request #535 from sslavic/patch-2. Closes #535. + [Fixed typo in scaladoc] + + 23af00f 2014-02-03 13:02:09 -0800 + Merge pull request #528 from mengxr/sample. Closes #528. + [ Refactor RDD sampling and add randomSplit to RDD (update)] + + 1625d8c 2014-02-03 11:25:39 -0800 + Merge pull request #530 from aarondav/cleanup. Closes #530. + [Remove explicit conversion to PairRDDFunctions in cogroup()] + + 0386f42 2014-02-02 21:51:17 -0800 + Merge pull request #529 from hsaputra/cleanup_right_arrowop_scala + [Change the ⇒ character (maybe from scalariform) to => in Scala code for style consistency] + + a8cf3ec 2014-01-31 16:52:02 -0800 + Merge pull request #527 from ankurdave/graphx-assembly-pom + [Add GraphX to assembly/pom.xml] + + ac712e4 2014-01-30 09:33:18 -0800 + Merge pull request #524 from rxin/doc + [Added spark.shuffle.file.buffer.kb to configuration doc.] 
+ + 0ff38c2 2014-01-29 12:44:54 -0800 + Merge pull request #494 from tyro89/worker_registration_issue + [Issue with failed worker registrations] + + 7930209 2014-01-28 21:51:05 -0800 + Merge pull request #497 from tdas/docs-update + [Updated Spark Streaming Programming Guide] + + f8c742c 2014-01-28 21:30:20 -0800 + Merge pull request #523 from JoshRosen/SPARK-1043 + [Switch from MUTF8 to UTF8 in PySpark serializers.] + + Switch from MUTF8 to UTF8 in PySpark serializers. + Josh Rosen + 2014-01-28 19:50:26 -0800 + Commit: 1381fc7 + + 84670f2 2014-01-27 17:08:35 -0800 + Merge pull request #466 from liyinan926/file-overwrite-new + [Allow files added through SparkContext.addFile() to be overwritten] + + 3d5c03e 2014-01-27 16:27:01 -0800 + Merge pull request #516 from sarutak/master + [modified SparkPluginBuild.scala to use https protocol for accessing gith...] + + f16c21e 2014-01-27 14:24:06 -0800 + Merge pull request #490 from hsaputra/modify_checkoption_with_isdefined + [Replace the check for None Option with isDefined and isEmpty in Scala code] + + f67ce3e 2014-01-27 11:15:51 -0800 + Merge pull request #460 from srowen/RandomInitialALSVectors + [Choose initial user/item vectors uniformly on the unit sphere] + + modified SparkPluginBuild.scala to use https protocol for accessing github. + sarutak + 2014-01-27 17:00:26 +0900 + Commit: 6a5af7b + + c40619d 2014-01-25 22:41:30 -0800 + Merge pull request #504 from JoshRosen/SPARK-1025 + [Fix PySpark hang when input files are deleted (SPARK-1025)] + + c66a2ef 2014-01-25 22:36:07 -0800 + Merge pull request #511 from JoshRosen/SPARK-1040 + [Fix ClassCastException in JavaPairRDD.collectAsMap() (SPARK-1040)] + + Fix ClassCastException in JavaPairRDD.collectAsMap() (SPARK-1040) + Josh Rosen + 2014-01-25 16:39:20 -0800 + Commit: 740e865 + + Increase JUnit test verbosity under SBT. 
+ Josh Rosen + 2014-01-25 16:32:44 -0800 + Commit: 531d9d7 + + 05be704 2014-01-23 20:53:18 -0800 + Merge pull request #505 from JoshRosen/SPARK-1026 + [Deprecate mapPartitionsWithSplit in PySpark (SPARK-1026)] + + Deprecate mapPartitionsWithSplit in PySpark. + Josh Rosen + 2014-01-23 20:01:36 -0800 + Commit: 4cebb79 + + 3d6e754 2014-01-23 19:47:00 -0800 + Merge pull request #503 from pwendell/master + [Fix bug on read-side of external sort when using Snappy.] + + Minor fix + Patrick Wendell + 2014-01-23 19:23:12 -0800 + Commit: ff44732 + + c319617 2014-01-23 19:11:59 -0800 + Merge pull request #502 from pwendell/clone-1 + [Remove Hadoop object cloning and warn users making Hadoop RDD's.] + + cad3002 2014-01-23 19:08:34 -0800 + Merge pull request #501 from JoshRosen/cartesian-rdd-fixes + [Fix two bugs in PySpark cartesian(): SPARK-978 and SPARK-1034] + + Minor changes after auditing diff from earlier version + Patrick Wendell + 2014-01-23 18:30:11 -0800 + Commit: 268ecbd + + Fix for SPARK-1025: PySpark hang on missing files. + Josh Rosen + 2014-01-23 18:10:16 -0800 + Commit: f830684 + + Response to Matei's review + Patrick Wendell + 2014-01-23 18:12:40 -0800 + Commit: c58d4ea + + Fix bug on read-side of external sort when using Snappy. + Patrick Wendell + 2014-01-23 17:59:42 -0800 + Commit: 0213b40 + + Remove Hadoop object cloning and warn users making Hadoop RDD's. + Patrick Wendell + 2014-01-23 13:30:54 -0800 + Commit: 7101017 + + Fix SPARK-978: ClassCastException in PySpark cartesian. 
+ Josh Rosen + 2014-01-23 15:09:19 -0800 + Commit: 6156990 + + Fix SPARK-1034: Py4JException on PySpark Cartesian Result + Josh Rosen + 2014-01-23 13:05:59 -0800 + Commit: 0035dbb + + fad6aac 2014-01-23 11:14:15 -0800 + Merge pull request #406 from eklavya/master + [Extending Java API coverage] + + a2b47da 2014-01-23 10:48:26 -0800 + Merge pull request #499 from jianpingjwang/dev1 + [Replace commons-math with jblas in SVDPlusPlus] + + fixed ClassTag in mapPartitions + eklavya + 2014-01-23 17:40:36 +0530 + Commit: 60e7457 + + Add jblas dependency + Jianping J Wang + 2014-01-23 19:54:01 +0800 + Commit: 19a01c1 + + Add jblas dependency + Jianping J Wang + 2014-01-23 19:48:39 +0800 + Commit: a5a513e + + Replace commons-math with jblas + Jianping J Wang + 2014-01-23 19:44:30 +0800 + Commit: cc0fd33 + + a1cd185 2014-01-22 19:37:29 -0800 + Merge pull request #496 from pwendell/master + [Fix bug in worker clean-up in UI] + + 034dce2 2014-01-22 18:58:02 -0800 + Merge pull request #447 from CodingCat/SPARK-1027 + [fix for SPARK-1027] + + Fix bug in worker clean-up in UI + Patrick Wendell + 2014-01-22 18:19:46 -0800 + Commit: 6285513 + + refactor sparkHome to val + CodingCat + 2014-01-22 19:32:51 -0500 + Commit: 2b3c461 + + 3184fac 2014-01-22 15:45:04 -0800 + Merge pull request #495 from srowen/GraphXCommonsMathDependency + [Fix graphx Commons Math dependency] + + Also add graphx commons-math3 dependeny in sbt build + Sean Owen + 2014-01-22 22:40:41 +0000 + Commit: 4476398 + + a1238bb 2014-01-22 14:32:59 -0800 + Merge pull request #492 from skicavs/master + [fixed job name and usage information for the JavaSparkPi example] + + Depend on Commons Math explicitly instead of accidentally getting it from Hadoop (which stops working in 2.2.x) and also use the newer commons-math3 + Sean Owen + 2014-01-22 22:25:49 +0000 + Commit: fd0c5b8 + + 576c4a4 2014-01-22 14:10:07 -0800 + Merge pull request #478 from sryza/sandy-spark-1033 + [SPARK-1033. 
Ask for cores in Yarn container requests] + + 5bcfd79 2014-01-22 14:05:48 -0800 + Merge pull request #493 from kayousterhout/double_add + [Fixed bug where task set managers are added to queue twice] + + d009b17 2014-01-22 14:01:30 -0800 + Merge pull request #315 from rezazadeh/sparsesvd + [Sparse SVD] + + Fixed bug where task set managers are added to queue twice + Kay Ousterhout + 2014-01-22 09:49:31 -0800 + Commit: 19da82c + + fixed job name and usage information for the JavaSparkPi example + Kevin Mader + 2014-01-22 15:58:23 +0100 + Commit: 36f9a64 + + Replace the code to check for Option != None with Option.isDefined call in Scala code. + Henry Saputra + 2014-01-21 23:22:10 -0800 + Commit: 90ea9d5 + + 749f842 2014-01-21 14:53:49 -0800 + Merge pull request #489 from ash211/patch-6 + [Clarify spark.default.parallelism] + + Clarify spark.default.parallelism + Andrew Ash + 2014-01-21 14:49:35 -0800 + Commit: 069bb94 + + f854498 2014-01-21 10:49:54 -0800 + Merge pull request #469 from ajtulloch/use-local-spark-context-in-tests-for-mllib + [[MLlib] Use a LocalSparkContext trait in test suites] + + Fixed import order + Andrew Tulloch + 2014-01-21 13:34:59 +0000 + Commit: 3a067b4 + + Incorporate Tom's comments - update doc and code to reflect that core requests may not always be honored + Sandy Ryza + 2014-01-21 00:38:02 -0800 + Commit: adf4261 + + 77b986f 2014-01-21 00:09:42 -0800 + Merge pull request #480 from pwendell/0.9-fixes + [Handful of 0.9 fixes] + + Style clean-up + Patrick Wendell + 2014-01-20 23:42:24 -0800 + Commit: a9bcc98 + + c67d3d8 2014-01-20 23:34:35 -0800 + Merge pull request #484 from tdas/run-example-fix + [Made run-example respect SPARK_JAVA_OPTS and SPARK_MEM.] + + Removed SPARK_MEM from run-examples. 
+ Tathagata Das + 2014-01-20 23:15:28 -0800 + Commit: 65869f8 + + Adding small code comment + Patrick Wendell + 2014-01-20 23:11:45 -0800 + Commit: a917a87 + + 6b4eed7 2014-01-20 22:35:45 -0800 + Merge pull request #449 from CrazyJvm/master + [SPARK-1028 : fix "set MASTER automatically fails" bug.] + + 0367981 2014-01-20 22:25:50 -0800 + Merge pull request #482 from tdas/streaming-example-fix + [Added StreamingContext.awaitTermination to streaming examples] + + 7373ffb 2014-01-20 21:44:29 -0800 + Merge pull request #483 from pwendell/gitignore + [Restricting /lib to top level directory in .gitignore] + + Made run-example respect SPARK_JAVA_OPTS and SPARK_MEM. + Tathagata Das + 2014-01-20 20:48:59 -0800 + Commit: e0b741d + + Restricting /lib to top level directory in .gitignore + Patrick Wendell + 2014-01-20 20:39:10 -0800 + Commit: e437069 + + Added StreamingContext.awaitTermination to streaming examples. + Tathagata Das + 2014-01-20 20:25:04 -0800 + Commit: 2e95174 + + Avoid matching attempt files in the checkpoint + Patrick Wendell + 2014-01-20 20:02:02 -0800 + Commit: d46df96 + + Remove shuffle files if they are still present on a machine. + Patrick Wendell + 2014-01-20 19:11:22 -0800 + Commit: de526ad + + Fixing speculation bug + Patrick Wendell + 2014-01-20 19:05:03 -0800 + Commit: f84400e + + Force use of LZF when spilling data + Patrick Wendell + 2014-01-20 19:00:48 -0800 + Commit: c324ac1 + + Bug fix for reporting of spill output + Patrick Wendell + 2014-01-20 18:34:00 -0800 + Commit: 1b29914 + + Minor fixes + Patrick Wendell + 2014-01-20 18:33:21 -0800 + Commit: 54867e9 + + Removing docs on akka options + Patrick Wendell + 2014-01-20 16:35:26 -0800 + Commit: cdb003e + + SPARK-1033. 
Ask for cores in Yarn container requests + Sandy Ryza + 2014-01-19 10:16:25 -0800 + Commit: 3e85b87 + + fix for SPARK-1027 + CodingCat + 2014-01-15 20:46:14 -0500 + Commit: 29f4b6a + + executor creation failed should not make the worker restart + CodingCat + 2014-01-15 19:32:50 -0500 + Commit: f9a95d6 + + 792d908 2014-01-19 11:33:11 -0800 + Merge pull request #470 from tgravescs/fix_spark_examples_yarn + [Only log error on missing jar to allow spark examples to jar.] + + 256a355 2014-01-19 10:29:54 -0800 + Merge pull request #458 from tdas/docs-update + [Updated java API docs for streaming, along with very minor changes in the code examples.] + + update comment + Thomas Graves + 2014-01-19 12:21:39 -0600 + Commit: dd56b21 + + Only log error on missing jar to allow spark examples to jar. + Thomas Graves + 2014-01-19 12:16:58 -0600 + Commit: ceb79a3 + + LocalSparkContext for MLlib + Andrew Tulloch + 2014-01-19 17:51:00 +0000 + Commit: 720836a + + Addressed comments from Reynold + Yinan Li + 2014-01-18 21:28:17 -0800 + Commit: 584323c + + fe8a354 2014-01-18 16:29:23 -0800 + Merge pull request #459 from srowen/UpdaterL2Regularization + [Correct L2 regularized weight update with canonical form] + + 73dfd42 2014-01-18 16:23:56 -0800 + Merge pull request #437 from mridulm/master + [Minor api usability changes] + + 4c16f79 2014-01-18 16:21:43 -0800 + Merge pull request #426 from mateiz/py-ml-tests + [Re-enable Python MLlib tests (require Python 2.7 and NumPy 1.7+)] + + bf56995 2014-01-18 16:17:34 -0800 + Merge pull request #462 from mateiz/conf-file-fix + [Remove Typesafe Config usage and conf files to fix nested property names] + + Allow files added through SparkContext.addFile() to be overwritten + Yinan Li + 2014-01-17 17:27:25 -0800 + Commit: fd833e7 + + aa981e4 2014-01-18 12:49:21 -0800 + Merge pull request #461 from pwendell/master + [Use renamed shuffle spill config in CoGroupedRDD.scala] + + Use renamed shuffle spill config in CoGroupedRDD.scala + Patrick Wendell + 
2014-01-18 11:55:10 -0800 + Commit: 5316bca + + Correct L2 regularized weight update with canonical form + Sean Owen + 2014-01-18 12:53:01 +0000 + Commit: e91ad3f + + rename to MatrixSVD + Reza Zadeh + 2014-01-17 14:40:51 -0800 + Commit: 85b95d0 + + rename to MatrixSVD + Reza Zadeh + 2014-01-17 14:39:30 -0800 + Commit: fa32998 + + Merge remote-tracking branch 'upstream/master' into sparsesvd + Reza Zadeh + 2014-01-17 14:34:03 -0800 + Commit: caf97a2 + + make example 0-indexed + Reza Zadeh + 2014-01-17 14:33:03 -0800 + Commit: 4e96757 + + 0index docs + Reza Zadeh + 2014-01-17 14:31:39 -0800 + Commit: 5c639d7 + + prettify + Reza Zadeh + 2014-01-17 14:14:29 -0800 + Commit: c9b4845 + + add rename computeSVD + Reza Zadeh + 2014-01-17 13:59:05 -0800 + Commit: dbec69b + + replace this.type with SVD + Reza Zadeh + 2014-01-17 13:57:27 -0800 + Commit: eb2d8c4 + + use 0-indexing + Reza Zadeh + 2014-01-17 13:55:42 -0800 + Commit: cb13b15 + + changes from PR + Reza Zadeh + 2014-01-17 13:39:40 -0800 + Commit: d28bf41 + + Address review comment + Mridul Muralidharan + 2014-01-17 18:28:55 +0530 + Commit: b690e11 + + d749d47 2014-01-16 23:18:15 -0800 + Merge pull request #451 from Qiuzhuang/master + [Fixed Window spark shell launch script error.] + + d4fd89e 2014-01-16 23:17:30 -0800 + Merge pull request #438 from ScrapCodes/clone-records-java-api + [Clone records java api] + + adding clone records field to equivaled java apis + Prashant Sharma + 2014-01-14 20:13:55 +0530 + Commit: fcb4fc6 + + Updated java API docs for streaming, along with very minor changes in the code examples. + Tathagata Das + 2014-01-16 14:44:02 -0800 + Commit: 11e6534 + + Use method, not variable + Mridul Muralidharan + 2014-01-16 17:26:42 +0530 + Commit: edd82c5 + + Address review comments + Mridul Muralidharan + 2014-01-16 17:23:25 +0530 + Commit: 1a0da89 + + Fixed Window spark shell launch script error. 
JIRA SPARK-1029:https://spark-project.atlassian.net/browse/SPARK-1029 + Qiuzhuang Lian + 2014-01-16 16:09:10 +0800 + Commit: 4e510b0 + + c06a307 2014-01-15 23:47:25 -0800 + Merge pull request #445 from kayousterhout/exec_lost + [Fail rather than hanging if a task crashes the JVM.] + + Updated unit test comment + Kay Ousterhout + 2014-01-15 23:46:14 -0800 + Commit: 718a13c + + 84595ea 2014-01-15 20:15:29 -0800 + Merge pull request #414 from soulmachine/code-style + [Code clean up for mllib] + + fix some format problem. + CrazyJvm + 2014-01-16 11:57:46 +0800 + Commit: 8400536 + + fix "set MASTER automatically fails" bug. + CrazyJvm + 2014-01-16 11:45:02 +0800 + Commit: 7a0c5b5 + + 0675ca5 2014-01-15 16:09:03 -0800 + Merge pull request #439 from CrazyJvm/master + [SPARK-1024 Remove "-XX:+UseCompressedStrings" option from tuning guide] + + Fail rather than hanging if a task crashes the JVM. + Kay Ousterhout + 2014-01-15 16:03:40 -0800 + Commit: a268d63 + + 4f0c361 2014-01-15 14:25:45 -0800 + Merge pull request #444 from mateiz/py-version + [Clarify that Python 2.7 is only needed for MLlib] + + Clarify that Python 2.7 is only needed for MLlib + Matei Zaharia + 2014-01-15 14:20:39 -0800 + Commit: 2ffdaef + + 59f475c 2014-01-15 13:55:14 -0800 + Merge pull request #442 from pwendell/standalone + [Workers should use working directory as spark home if it's not specified] + + 2a05403 2014-01-15 13:54:45 -0800 + Merge pull request #443 from tdas/filestream-fix + [Made some classes private[stremaing] and deprecated a method in JavaStreamingContext.] + + Made some classes private[stremaing] and deprecated a method in JavaStreamingContext. + Tathagata Das + 2014-01-15 12:15:46 -0800 + Commit: 9e63753 + + 5fecd25 2014-01-15 11:15:07 -0800 + Merge pull request #441 from pwendell/graphx-build + [GraphX shouldn't list Spark as provided.] 
+ + Workers should use working directory as spark home if it's not specified + Patrick Wendell + 2014-01-15 10:58:02 -0800 + Commit: 00a3f7e + + GraphX shouldn't list Spark as provided + Patrick Wendell + 2014-01-15 10:44:17 -0800 + Commit: 9259d70 + + 494d3c0 2014-01-15 10:00:50 -0800 + Merge pull request #433 from markhamstra/debFix + [Updated Debian packaging] + + cef2af9 2014-01-15 10:06:17 -0600 + Merge pull request #366 from colorant/yarn-dev + [More yarn code refactor] + + remove "-XX:+UseCompressedStrings" option + CrazyJvm + 2014-01-15 22:26:15 +0800 + Commit: 263933d + + 3d9e66d 2014-01-14 23:17:05 -0800 + Merge pull request #436 from ankurdave/VertexId-case + [Rename VertexID -> VertexId in GraphX] + + Expose method and class - so that we can use it from user code (particularly since checkpoint directory is autogenerated now + Mridul Muralidharan + 2014-01-15 12:44:44 +0530 + Commit: 0aea33d + + 139c24e 2014-01-14 23:07:55 -0800 + Merge pull request #435 from tdas/filestream-fix + [Fixed the flaky tests by making SparkConf not serializable] + + 087487e 2014-01-14 22:50:36 -0800 + Merge pull request #434 from rxin/graphxmaven + [Fixed SVDPlusPlusSuite in Maven build.] + + Merge remote-tracking branch 'apache/master' into filestream-fix + Tathagata Das + 2014-01-14 22:21:20 -0800 + Commit: 0e15bd7 + + Changed SparkConf to not be serializable. And also fixed unit-test log paths in log4j.properties of external modules. + Tathagata Das + 2014-01-14 22:20:14 -0800 + Commit: 1f4718c + + Fixed SVDPlusPlusSuite in Maven build. + Reynold Xin + 2014-01-14 22:18:43 -0800 + Commit: dfb1524 + + Removed repl-bin and updated maven build doc. 
+ Mark Hamstra + 2014-01-14 21:36:58 -0800 + Commit: 147a943 + + VertexID -> VertexId + Ankur Dave + 2014-01-14 22:17:18 -0800 + Commit: f4d9019 + + Add deb profile to assembly/pom.xml + Mark Hamstra + 2014-01-14 21:23:09 -0800 + Commit: 148757e + + 3a386e2 2014-01-14 21:52:50 -0800 + Merge pull request #424 from jegonzal/GraphXProgrammingGuide + [Additional edits for clarity in the graphx programming guide.] + + ad294db 2014-01-14 21:51:06 -0800 + Merge pull request #431 from ankurdave/graphx-caching-doc + [Describe caching and uncaching in GraphX programming guide] + + Describe GraphX caching and uncaching in guide + Ankur Dave + 2014-01-14 17:24:25 -0800 + Commit: 1210ec2 + + 74b46ac 2014-01-14 14:59:13 -0800 + Merge pull request #428 from pwendell/writeable-objects + [Don't clone records for text files] + + 193a075 2014-01-14 14:53:24 -0800 + Merge pull request #429 from ankurdave/graphx-examples-pom.xml + [Add GraphX dependency to examples/pom.xml] + + d601a76 2014-01-14 14:52:24 -0800 + Merge pull request #427 from pwendell/deprecate-aggregator + [Deprecate rather than remove old combineValuesByKey function] + + Add GraphX dependency to examples/pom.xml + Ankur Dave + 2014-01-14 13:57:51 -0800 + Commit: 8ea056d + + Style fix + Patrick Wendell + 2014-01-14 13:56:27 -0800 + Commit: b1b22b7 + + Adding fix covering combineCombinersByKey as well + Patrick Wendell + 2014-01-14 13:52:23 -0800 + Commit: 8ea2cd5 + + 2ce23a5 2014-01-14 13:28:44 -0800 + Merge pull request #425 from rxin/scaladoc + [API doc update & make Broadcast public] + + Complain if Python and NumPy versions are too old for MLlib + Matei Zaharia + 2014-01-14 12:27:58 -0800 + Commit: 5b3a3e2 + + Deprecate rather than remove old combineValuesByKey function + Patrick Wendell + 2014-01-14 12:15:10 -0800 + Commit: b683608 + + Re-enable Python MLlib tests (require Python 2.7 and NumPy 1.7+) + Matei Zaharia + 2014-01-14 12:14:48 -0800 + Commit: 938e4a0 + + Don't clone records for text files + Patrick 
Wendell + 2014-01-14 11:57:53 -0800 + Commit: 6f965a4 + + Fixed a typo in JavaSparkContext's API doc. + Reynold Xin + 2014-01-14 11:42:28 -0800 + Commit: f12e506 + + Maintain Serializable API compatibility by reverting back to java.io.Serializable for Broadcast and Accumulator. + Reynold Xin + 2014-01-14 11:30:59 -0800 + Commit: 1b5623f + + Added license header for package.scala in the Java API package. + Reynold Xin + 2014-01-14 11:20:12 -0800 + Commit: 55db774 + + Added package doc for the Java API. + Reynold Xin + 2014-01-14 11:16:25 -0800 + Commit: f8c12e9 + + Updated API doc for Accumulable and Accumulator. + Reynold Xin + 2014-01-14 11:16:08 -0800 + Commit: 6a12b9e + + Broadcast variable visibility change & doc update. + Reynold Xin + 2014-01-14 11:15:21 -0800 + Commit: 71b3007 + + Additional edits for clarity in the graphx programming guide. + Joseph E. Gonzalez + 2014-01-14 10:31:43 -0800 + Commit: 0bba773 + + 3fcc68b 2014-01-14 09:44:43 -0800 + Merge pull request #423 from jegonzal/GraphXProgrammingGuide + [Improving the graphx-programming-guide] + + Improving the graphx-programming-guide. + Joseph E. 
Gonzalez + 2014-01-14 09:40:06 -0800 + Commit: 486f37c + + Added parentheses for that getDouble() also has side effect + Frank Dai + 2014-01-14 18:56:11 +0800 + Commit: 57fcfc7 + + fa75e5e 2014-01-14 01:18:34 -0800 + Merge pull request #420 from pwendell/header-files + [Add missing header files] + + Add missing header files + Patrick Wendell + 2014-01-14 01:14:20 -0800 + Commit: 2303479 + + Modifications as suggested in PR feedback- + Saurabh Rawat + 2014-01-14 14:19:02 +0530 + Commit: 1442cd5 + + Merge remote-tracking branch 'upstream/master' into sparsesvd + Reza Zadeh + 2014-01-13 23:52:34 -0800 + Commit: 845e568 + + Merge remote-tracking branch 'upstream/master' into code-style + Frank Dai + 2014-01-14 15:29:17 +0800 + Commit: a3da468 + + Indent two spaces + Frank Dai + 2014-01-14 14:59:01 +0800 + Commit: c2852cf + + Since getLong() and getInt() have side effect, get back parentheses, and remove an empty line + Frank Dai + 2014-01-14 14:53:10 +0800 + Commit: 12386b3 + + Code clean up for mllib + Frank Dai + 2014-01-14 14:37:26 +0800 + Commit: 0d94d74 + + Address comments to fix code formats + Raymond Liu + 2014-01-10 09:44:44 +0800 + Commit: 4c22c55 + + Yarn workerRunnable refactor + Raymond Liu + 2014-01-09 14:16:07 +0800 + Commit: 161ab93 + + Yarn Client refactor + Raymond Liu + 2014-01-09 09:53:50 +0800 + Commit: 79a5ba3 + + Modifications as suggested in PR feedback- + Saurabh Rawat + 2014-01-13 23:40:04 +0530 + Commit: e922973 + + Remove default param from mapPartitions + eklavya + 2014-01-13 18:13:22 +0530 + Commit: fa42951 + + Remove classtag from mapPartitions. + eklavya + 2014-01-13 18:09:58 +0530 + Commit: 8fe562c + + Added foreachPartition method to JavaRDD. + eklavya + 2014-01-13 17:56:47 +0530 + Commit: 6a65fee + + Added mapPartitions method to JavaRDD. + eklavya + 2014-01-13 17:56:10 +0530 + Commit: dbadc6b + + Added setter method setGenerator to JavaRDD. 
+ eklavya + 2014-01-13 17:53:35 +0530 + Commit: aae8a01 + + Merge remote-tracking branch 'upstream/master' into sparsesvd + Reza Zadeh + 2014-01-11 13:27:15 -0800 + Commit: f324d53 + + add dimension parameters to example + Reza Zadeh + 2014-01-10 21:30:54 -0800 + Commit: 1afdeae + + Merge remote-tracking branch 'upstream/master' into sparsesvd + Reza Zadeh + 2014-01-09 22:45:32 -0800 + Commit: 21c8a54 + + fix example + Reza Zadeh + 2014-01-09 22:39:41 -0800 + Commit: cf5bd4a + + documentation for sparsematrix + Reza Zadeh + 2014-01-07 17:19:28 -0800 + Commit: 4f38b6f + + More sparse matrix usage. + Reza Zadeh + 2014-01-07 17:16:17 -0800 + Commit: 7d7490b + + fix docs to use SparseMatrix + Reza Zadeh + 2014-01-05 18:03:57 -0800 + Commit: 746148b + + use SparseMatrix everywhere + Reza Zadeh + 2014-01-04 14:28:07 -0800 + Commit: 06c0f76 + + prettify + Reza Zadeh + 2014-01-04 12:44:04 -0800 + Commit: cdff9fc + + new example file + Reza Zadeh + 2014-01-04 12:33:22 -0800 + Commit: e9bd6cb + + fix tests + Reza Zadeh + 2014-01-04 11:52:42 -0800 + Commit: 8bfcce1 + + set methods + Reza Zadeh + 2014-01-04 11:30:36 -0800 + Commit: 35adc72 + + add k parameter + Reza Zadeh + 2014-01-04 01:52:28 -0800 + Commit: 73daa70 + + using decomposed matrix struct now + Reza Zadeh + 2014-01-04 00:38:53 -0800 + Commit: 26a74f0 + + new return struct + Reza Zadeh + 2014-01-04 00:15:04 -0800 + Commit: d2d5e5e + + start using matrixentry + Reza Zadeh + 2014-01-03 22:17:24 -0800 + Commit: 7f631dd + + rename sparsesvd.scala + Reza Zadeh + 2014-01-03 21:55:38 -0800 + Commit: 6bcdb76 + + New matrix entry file + Reza Zadeh + 2014-01-03 21:54:57 -0800 + Commit: b059a2a + + fix error message + Reza Zadeh + 2014-01-02 01:51:38 -0800 + Commit: e617ae2 + + Merge remote-tracking branch 'upstream/master' into sparsesvd + Reza Zadeh + 2014-01-02 01:50:30 -0800 + Commit: 6140578 + + more docs yay + Reza Zadeh + 2014-01-01 20:22:29 -0800 + Commit: 2612164 + + javadoc for sparsesvd + Reza Zadeh + 2014-01-01 
20:20:16 -0800 + Commit: 915d53f + + old version of spark_ec2 + Reza Zadeh + 2014-01-01 20:08:01 -0800 + Commit: c868d71 + + remove accidental changes to ec2 script + Reza Zadeh + 2014-01-01 20:05:03 -0800 + Commit: 0c3797d + + doc tweaks + Reza Zadeh + 2014-01-01 20:03:47 -0800 + Commit: 53ccf65 + + doc tweak + Reza Zadeh + 2014-01-01 20:02:37 -0800 + Commit: 97dc527 + + doc tweaks + Reza Zadeh + 2014-01-01 20:01:13 -0800 + Commit: b941b6f + + tweaks to docs + Reza Zadeh + 2014-01-01 19:53:14 -0800 + Commit: 185c882 + + New documentation + Reza Zadeh + 2014-01-01 19:53:04 -0800 + Commit: dd0d3f0 + + Merge remote-tracking branch 'upstream/master' into sparsesvd + Reza Zadeh + 2014-01-01 18:12:35 -0800 + Commit: 7c04b31 + + large scale considerations + Reza Zadeh + 2013-12-27 04:15:13 -0500 + Commit: ae5102a + + initial large scale testing begin + Reza Zadeh + 2013-12-27 01:51:19 -0500 + Commit: 642ab5c + + cleanup documentation + Reza Zadeh + 2013-12-27 00:41:46 -0500 + Commit: 3369c2d + + add all tests + Reza Zadeh + 2013-12-27 00:36:41 -0500 + Commit: bdb5037 + + test for truncated svd + Reza Zadeh + 2013-12-27 00:34:59 -0500 + Commit: fa1e8d8 + + full rank matrix test added + Reza Zadeh + 2013-12-26 23:21:57 -0500 + Commit: 16de526 + + Main method added for svd + Reza Zadeh + 2013-12-26 18:13:21 -0500 + Commit: fe1a132 + + new main file + Reza Zadeh + 2013-12-26 18:09:33 -0500 + Commit: 1a21ba2 + + Object to hold the svd methods + Reza Zadeh + 2013-12-26 17:39:25 -0500 + Commit: 6c3674c + + Some documentation + Reza Zadeh + 2013-12-26 16:12:40 -0500 + Commit: 6e740cc + + Initial files - no tests + Reza Zadeh + 2013-12-26 15:01:03 -0500 + Commit: 1a173f0 + + +Release 0.9.1 + + Revert "[maven-release-plugin] prepare release v0.9.1-rc2" + Tathagata Das + 2014-03-26 21:53:07 -0700 + Commit: ea5da04 + + Revert "[maven-release-plugin] prepare for next development iteration" + Tathagata Das + 2014-03-26 21:51:40 -0700 + Commit: d16e863 + + [SPARK-1327] GLM needs to 
check addIntercept for intercept and weights + Xiangrui Meng + 2014-03-26 19:30:57 -0700 + Commit: 4901604, github.com/apache/spark/pull/236 + + SPARK-1322, top in pyspark should sort result in descending order. + Prashant Sharma + 2014-03-26 11:15:02 -0700 + Commit: 2f90dc5, github.com/apache/spark/pull/235 + + [maven-release-plugin] prepare for next development iteration + Ubuntu + 2014-03-26 09:26:45 +0000 + Commit: 1f785d4 + + [maven-release-plugin] prepare release v0.9.1-rc2 + Ubuntu + 2014-03-26 09:26:40 +0000 + Commit: 1197280 + + Updated CHANGES.txt + Tathagata Das + 2014-03-26 02:10:57 -0700 + Commit: 7495dba + + [SPARK-782] Made Spark use existing shaded ASM and removed Spark's ASM dependency + Tathagata Das + 2014-03-25 21:35:36 -0700 + Commit: da87240, github.com/apache/spark/pull/232 + + Revert "[maven-release-plugin] prepare release v0.9.1-rc1" + Tathagata Das + 2014-03-25 15:01:52 -0700 + Commit: 55abe72 + + Revert "[maven-release-plugin] prepare for next development iteration" + Tathagata Das + 2014-03-25 15:01:36 -0700 + Commit: b94f997 + + [maven-release-plugin] prepare for next development iteration + Ubuntu + 2014-03-24 06:56:16 +0000 + Commit: 12e237e + + [maven-release-plugin] prepare release v0.9.1-rc1 + Ubuntu + 2014-03-24 06:56:10 +0000 + Commit: 81c6a06 + + Removed all occurences of incubator from all the pom.xml. + Tathagata Das + 2014-03-23 23:31:59 -0700 + Commit: 60ddb34 + + Updated CHANGES.txt file. 
+ Tathagata Das + 2014-03-23 13:16:50 -0700 + Commit: f176b03 + + Fix to Stage UI to display numbers on progress bar + Emtiaz Ahmed + 2014-03-21 18:07:05 -0700 + Commit: 5e7ac0d, github.com/apache/spark/pull/201 + + SPARK-1284: Fix improper use of SimpleDateFormat + zsxwing + 2014-03-21 16:39:23 -0700 + Commit: 8856076, github.com/apache/spark/pull/179 + + [SPARK-1273] use doi links in mllib-guide + Xiangrui Meng + 2014-03-21 14:35:32 -0700 + Commit: d68549e, github.com/apache/spark/pull/198 + + Removed incubating from Spark version in all the pom.xml. + Tathagata Das + 2014-03-20 18:02:55 -0700 + Commit: 8b1e793 + + Bumped versions to Spark 0.9.1 + Tathagata Das + 2014-03-20 16:55:35 -0700 + Commit: 8a882ef, github.com/apache/spark/pull/190 + + SPARK-1032. If Yarn app fails before registering, app master stays aroun... + Sandy Ryza + 2014-03-20 16:50:44 -0500 + Commit: c6630d3, github.com/apache/spark/pull/28 + + SPARK-1051. On YARN, executors don't doAs submitting user + Sandy Ryza + 2014-03-20 14:48:05 -0500 + Commit: 748f002, github.com/apache/spark/pull/29 + + [SPARK-1285] Backporting updates to streaming docs to branch 0.9 + Aaron Kimball , Tathagata Das , Chen Chao , Andrew Or + 2014-03-20 12:27:47 -0700 + Commit: 1e36690, github.com/apache/spark/pull/183 + + [SPARK-1273] MLlib bug fixes, improvements, and doc updates for v0.9.1 + Xiangrui Meng , Sean Owen , Andrew Tulloch , Chen Chao + 2014-03-19 19:05:26 -0700 + Commit: 1cc979e, github.com/apache/spark/pull/175 + + [SPARK-1275] Made dev/run-tests executable. 
+ Tathagata Das + 2014-03-19 16:10:45 -0700 + Commit: a4eef65, github.com/apache/spark/pull/178 + + Update the yarn alpha version to 0.9.1-incubating-SNAPSHOT + Thomas Graves + 2014-03-19 12:41:11 -0500 + Commit: 72875b2 + + SPARK-1203 fix saving to hdfs from yarn + Thomas Graves + 2014-03-19 08:19:47 -0500 + Commit: 250ec27, github.com/apache/spark/pull/173 + + bugfix: Wrong "Duration" in "Active Stages" in stages page + shiyun.wxm + 2014-03-19 01:42:42 -0700 + Commit: d385b5a, github.com/apache/spark/pull/170 + + [SPARK-1274] Add dev scripts to merge PRs and create releases from master to branch-0.9 + Tathagata Das + 2014-03-18 22:09:16 -0700 + Commit: 7ec78bc, github.com/apache/spark/pull/176 + + Bundle tachyon: SPARK-1269 + Nick Lanham + 2014-03-18 22:05:18 -0700 + Commit: 0183ddd, github.com/apache/spark/pull/137 + + [Spark-1261] add instructions for running python examples to doc overview page + Diana Carroll + 2014-03-17 17:37:03 -0700 + Commit: 20d9458, github.com/apache/spark/pull/162 + + SPARK-1244: Throw exception if map output status exceeds frame size + Patrick Wendell , Andrew Or + 2014-03-17 14:06:28 -0700 + Commit: 4562140, github.com/apache/spark/pull/152 + + SPARK-1240: handle the case of empty RDD when takeSample + CodingCat + 2014-03-16 22:40:22 -0700 + Commit: af7e8b1, github.com/apache/spark/pull/135 + + SPARK-977 Added Python RDD.zip function + Prabin Banka + 2014-03-16 22:16:17 -0700 + Commit: 1dc1e98, github.com/apache/spark/pull/76 + + Spark-1163, Added missing Python RDD functions + prabinb + 2014-03-16 22:14:53 -0700 + Commit: 249930a, github.com/apache/spark/pull/92 + + SPARK-1168, Added foldByKey to pyspark. 
+ Prashant Sharma + 2014-03-16 22:13:33 -0700 + Commit: 4480505, github.com/apache/spark/pull/115 + + Updated link for pyspark examples in docs + Jyotiska NK + 2014-03-16 22:12:51 -0700 + Commit: e74e79a, github.com/apache/spark/pull/22 + + SPARK-1019: pyspark RDD take() throws an NPE + Patrick Wendell + 2014-03-12 23:17:17 -0700 + Commit: ef74e44, github.com/apache/spark/pull/112 + + Fix example bug: compile error + jianghan + 2014-03-12 19:46:48 -0700 + Commit: 87e4dd5, github.com/apache/spark/pull/132 + + SPARK-1162 Added top in python. + Prashant Sharma + 2014-03-12 15:57:54 -0700 + Commit: 51a77e9, github.com/apache/spark/pull/93 + + Version fix in pom file + Patrick Wendell + 2014-03-11 14:48:01 -0700 + Commit: 7049164 + + Log4j build fix on 0.9 branch + Patrick Wendell + 2014-03-11 11:53:29 -0700 + Commit: 6cbd580 + + SPARK-1167: Remove metrics-ganglia from default build due to LGPL issues... + Patrick Wendell + 2014-03-11 11:24:21 -0700 + Commit: 0c91927, github.com/apache/spark/pull/108 + + For outputformats that are Configurable, call setConf before sending data to them. + Bryn Keller + 2014-03-09 17:47:46 -0700 + Commit: 6f0db0a, github.com/apache/spark/pull/638 + + SPARK-1190: Do not initialize log4j if slf4j log4j backend is not being used + Patrick Wendell + 2014-03-08 16:02:56 -0800 + Commit: 0f0d044, github.com/apache/spark/pull/107 + + SPARK-1184: Update the distribution tar.gz to include spark-assembly jar + Mark Grover + 2014-03-05 16:55:36 -0800 + Commit: 0fc0fdb, github.com/apache/spark/pull/78 + + SPARK-1109 wrong API docs for pyspark map function + Prashant Sharma + 2014-03-04 15:33:00 -0800 + Commit: 7ea89ec, github.com/apache/spark/pull/73 + + Add Jekyll tag to isolate "production-only" doc components. (0.9 version) + Patrick Wendell + 2014-03-02 18:18:44 -0800 + Commit: 267d96c, github.com/apache/spark/pull/57 + + Removed reference to incubation in Spark user docs. 
+ Reynold Xin + 2014-02-27 21:14:18 -0800 + Commit: f2bf44a, github.com/apache/spark/pull/2 + + [SPARK-1089] fix the regression problem on ADD_JARS in 0.9 + CodingCat + 2014-02-26 23:42:53 -0800 + Commit: bc5e7d7, github.com/apache/spark/pull/13 + + Removed reference to incubation in README.md. + Reynold Xin + 2014-02-26 16:53:56 -0800 + Commit: 349764d, github.com/apache/spark/pull/1 + + SPARK-1115: Catch depickling errors + Bouke van der Bijl + 2014-02-26 14:53:30 -0800 + Commit: 886a466, github.com/apache/incubator-spark/pull/644 + + SPARK-1135: fix broken anchors in docs + Matei Zaharia + 2014-02-26 11:56:12 -0800 + Commit: 6fe72dd, github.com/apache/spark/pull/3 + + Fix removal from shuffleToMapStage to search for a key-value pair with our stage instead of using our shuffleID. + Matei Zaharia + 2014-02-24 17:01:21 -0800 + Commit: 0661cdc + + SPARK-1124: Fix infinite retries of reduce stage when a map stage failed + Matei Zaharia + 2014-02-24 17:00:47 -0800 + Commit: 5e74b8e + + [SPARK-1055] fix the SCALA_VERSION and SPARK_VERSION in docker file + CodingCat , Nan Zhu + 2014-02-22 15:39:41 -0800 + Commit: 00db30c, github.com/apache/incubator-spark/pull/634 + + SPARK-1117: update accumulator docs + Xiangrui Meng + 2014-02-21 22:44:59 -0800 + Commit: ed58742, github.com/apache/incubator-spark/pull/631 + + [SPARK-1113] External spilling - fix Int.MaxValue hash code collision bug + Andrew Or + 2014-02-21 20:06:09 -0800 + Commit: 84131fe, github.com/apache/incubator-spark/pull/624 + + MLLIB-25: Implicit ALS runs out of memory for moderately large numbers of features + Sean Owen + 2014-02-21 13:39:17 -0800 + Commit: 998abae, github.com/apache/incubator-spark/pull/629 + + SPARK-1111: URL Validation Throws Error for HDFS URL's + Patrick Wendell + 2014-02-21 11:12:38 -0800 + Commit: b3fff96, github.com/apache/incubator-spark/pull/625 + + Super minor: Add require for mergeCombiners in combineByKey + Aaron Davidson + 2014-02-20 16:46:29 -0800 + Commit: 3c44ff4, 
github.com/apache/incubator-spark/pull/623 + + [SPARK-1105] fix site scala version error in docs + CodingCat + 2014-02-19 15:56:24 -0800 + Commit: 289d761, github.com/apache/incubator-spark/pull/618 + + Revert "[SPARK-1105] fix site scala version error in doc" + Patrick Wendell + 2014-02-18 17:47:34 -0800 + Commit: 7bde72e + + [SPARK-1105] fix site scala version error in doc + CodingCat + 2014-02-18 16:33:41 -0800 + Commit: 0f0395c, github.com/apache/incubator-spark/pull/616 + + Worker registration logging fix + Andrew Ash + 2014-02-17 09:52:16 -0800 + Commit: b0b5288, github.com/apache/incubator-spark/pull/608 + + fix for https://spark-project.atlassian.net/browse/SPARK-1052 + Bijay Bisht + 2014-02-16 16:52:57 -0800 + Commit: e797c1a, github.com/apache/incubator-spark/pull/568 + + Add c3 instance types to Spark EC2 + Christian Lundgren + 2014-02-13 12:44:21 -0800 + Commit: 19b4bb2, github.com/apache/incubator-spark/pull/595 + + SPARK-1088: Create a script for running tests so we can have version specific testing on Jenkins (branch-0.9) + Reynold Xin + 2014-02-12 23:42:58 -0800 + Commit: e5b86b1, github.com/apache/incubator-spark/pull/593 + + Ported hadoopClient jar for < 1.0.1 fix + Bijay Bisht + 2014-02-12 23:42:10 -0800 + Commit: 8093de1, github.com/apache/incubator-spark/pull/584 + + 754bc18 2014-02-12 14:26:39 -0800 + Merge pull request #590 from rxin/scalastyle. + [SPARK-1085: Fix Jenkins pull request builder for branch-0.9 (scalastyle command not found)] + + 28f88c5 2014-02-11 22:43:09 -0800 + Merge pull request #583 from colorant/zookeeper. + [Minor fix for ZooKeeperPersistenceEngine to use configured working dir] + + e70690f 2014-02-09 23:33:35 -0800 + Revert "Merge pull request #560 from pwendell/logging. Closes #560." + [This reverts commit 2e3d1c31db55c7f961e559e47bb497ae15cb74d7.] + + de22abc 2014-02-08 23:37:05 -0800 + Merge pull request #562 from jyotiska/master. Closes #562. 
+ [Added example Python code for sort] + + 2e3d1c3 2014-02-08 23:35:41 -0800 + Merge pull request #560 from pwendell/logging. Closes #560. + [[WIP] SPARK-1067: Default log4j initialization causes errors for those not using log4j] + + 22e0a3b 2014-02-08 13:00:07 -0800 + Merge pull request #561 from Qiuzhuang/master. Closes #561. + [Kill drivers in postStop() for Worker.] + + ce179f6 2014-02-06 22:06:30 -0800 + Merge pull request #533 from andrewor14/master. Closes #533. + [External spilling - generalize batching logic] + + 24e5298 2014-02-06 16:15:36 -0800 + Merge pull request #450 from kayousterhout/fetch_failures. Closes #450. + [Only run ResubmitFailedStages event after a fetch fails] + + 94896bb 2014-02-06 16:13:10 -0800 + Merge pull request #321 from kayousterhout/ui_kill_fix. Closes #321. + [Inform DAG scheduler about all started/finished tasks.] + + 44a2b03 2014-02-05 23:38:25 -0800 + Merge pull request #545 from kayousterhout/fix_progress. Closes #545. + [Fix off-by-one error with task progress info log.] + + b044b0b 2014-02-05 23:37:38 -0800 + Merge pull request #526 from tgravescs/yarn_client_stop_am_fix. Closes #526. + [spark on yarn - yarn-client mode doesn't always exit immediately] + + d815cfa 2014-02-04 09:47:25 -0800 + Merge pull request #534 from sslavic/patch-1. Closes #534. + [Fixed wrong path to compute-classpath.cmd] + + f3cba2d 2014-02-04 09:46:00 -0800 + Merge pull request #535 from sslavic/patch-2. Closes #535. + [Fixed typo in scaladoc] + + 5f63f32 2014-02-03 22:44:30 -0800 + Merge pull request #449 from CrazyJvm/master + [SPARK-1028 : fix "set MASTER automatically fails" bug.] + + 6e4d089 2014-02-03 22:42:43 -0800 + Merge pull request #414 from soulmachine/code-style + [Code clean up for mllib] + + 0021ef9 2014-02-03 22:42:01 -0800 + Merge pull request #445 from kayousterhout/exec_lost + [Fail rather than hanging if a task crashes the JVM.] 
+ + dc8adf1 2014-02-03 22:41:30 -0800 + Merge pull request #489 from ash211/patch-6 + [Clarify spark.default.parallelism] + + 574741f 2014-02-03 22:40:55 -0800 + Merge pull request #493 from kayousterhout/double_add + [Fixed bug where task set managers are added to queue twice] + + 1280e8a 2014-02-03 22:40:29 -0800 + Merge pull request #511 from JoshRosen/SPARK-1040 + [Fix ClassCastException in JavaPairRDD.collectAsMap() (SPARK-1040)] + + 2c6c9b9 2014-02-03 22:39:59 -0800 + Merge pull request #504 from JoshRosen/SPARK-1025 + [Fix PySpark hang when input files are deleted (SPARK-1025)] + + b10f607 2014-02-03 22:39:10 -0800 + Merge pull request #516 from sarutak/master + [modified SparkPluginBuild.scala to use https protocol for accessing gith...] + + 18520f5 2014-02-03 22:37:38 -0800 + Merge pull request #490 from hsaputra/modify_checkoption_with_isdefined + [Replace the check for None Option with isDefined and isEmpty in Scala code] + + a414071 2014-01-31 16:54:33 -0800 + Merge pull request #524 from rxin/doc + [Added spark.shuffle.file.buffer.kb to configuration doc.] + + a41a83c 2014-01-31 16:53:26 -0800 + Merge pull request #527 from ankurdave/graphx-assembly-pom + [Add GraphX to assembly/pom.xml] + + d18fe1f 2014-01-28 21:55:15 -0800 + Merge pull request #497 from tdas/docs-update + [Updated Spark Streaming Programming Guide] + + 5edbd17 2014-01-28 21:32:58 -0800 + Merge pull request #523 from JoshRosen/SPARK-1043 + [Switch from MUTF8 to UTF8 in PySpark serializers.] + + [maven-release-plugin] prepare for next development iteration + Ubuntu + 2014-01-24 06:15:15 +0000 + Commit: 0f60ef2 + +Release 0.9.0-incubating + + d0a105d Thu Jan 23 20:53:31 2014 -0800 + Merge pull request #505 from JoshRosen/SPARK-1026 + [Deprecate mapPartitionsWithSplit in PySpark (SPARK-1026)] + + e66d4c2 Thu Jan 23 19:47:16 2014 -0800 + Merge pull request #503 from pwendell/master + [Fix bug on read-side of external sort when using Snappy.] 
+ + e8d3f2b Thu Jan 23 19:20:22 2014 -0800 + Merge pull request #502 from pwendell/clone-1 + [Remove Hadoop object cloning and warn users making Hadoop RDD's.] + + 7a62353 Thu Jan 23 19:09:25 2014 -0800 + Merge pull request #501 from JoshRosen/cartesian-rdd-fixes + [Fix two bugs in PySpark cartesian(): SPARK-978 and SPARK-1034] + + 51960b8 Wed Jan 22 19:37:50 2014 -0800 + Merge pull request #496 from pwendell/master + [Fix bug in worker clean-up in UI] + + 828f7b4 Wed Jan 22 15:45:18 2014 -0800 + Merge pull request #495 from srowen/GraphXCommonsMathDependency + [Fix graphx Commons Math dependency] + + dc5857a Wed Jan 22 14:33:25 2014 -0800 + Merge pull request #492 from skicavs/master + [fixed job name and usage information for the JavaSparkPi example] + + dd533c9 Wed Jan 22 14:15:58 2014 -0800 + Merge pull request #478 from sryza/sandy-spark-1033 + [SPARK-1033. Ask for cores in Yarn container requests] + + b6fd3cd Tue Jan 21 00:12:01 2014 -0800 + Merge pull request #480 from pwendell/0.9-fixes + [Handful of 0.9 fixes] + + e5f8917 Mon Jan 20 23:35:07 2014 -0800 + Merge pull request #484 from tdas/run-example-fix + [Made run-example respect SPARK_JAVA_OPTS and SPARK_MEM.] + + 410ba06 Mon Jan 20 22:26:14 2014 -0800 + Merge pull request #482 from tdas/streaming-example-fix + [Added StreamingContext.awaitTermination to streaming examples] + + f137947 Mon Jan 20 22:24:07 2014 -0800 + Merge pull request #483 from pwendell/gitignore + [Restricting /lib to top level directory in .gitignore] + + 94ae25d Sun Jan 19 11:33:51 2014 -0800 + Merge pull request #470 from tgravescs/fix_spark_examples_yarn + [Only log error on missing jar to allow spark examples to jar.] + + 0f077b5 Sun Jan 19 10:30:29 2014 -0800 + Merge pull request #458 from tdas/docs-update + [Updated java API docs for streaming, along with very minor changes in the code examples.] 
+ + 03019d1 Sat Jan 18 16:29:43 2014 -0800 + Merge pull request #459 from srowen/UpdaterL2Regularization + [Correct L2 regularized weight update with canonical form] + + 76147a2 Sat Jan 18 16:24:16 2014 -0800 + Merge pull request #437 from mridulm/master + [Minor api usability changes] + + 4ac8cab Sat Jan 18 16:22:46 2014 -0800 + Merge pull request #426 from mateiz/py-ml-tests + [Re-enable Python MLlib tests (require Python 2.7 and NumPy 1.7+)] + + 34e911c Sat Jan 18 16:17:34 2014 -0800 + Merge pull request #462 from mateiz/conf-file-fix + [Remove Typesafe Config usage and conf files to fix nested property names] + + ff7201c Sat Jan 18 12:50:02 2014 -0800 + Merge pull request #461 from pwendell/master + [Use renamed shuffle spill config in CoGroupedRDD.scala] + + 7b0d5a5 Thu Jan 16 23:18:48 2014 -0800 + Merge pull request #451 from Qiuzhuang/master + [Fixed Window spark shell launch script error.] + + 4ccedb3 Wed Jan 15 14:26:48 2014 -0800 + Merge pull request #444 from mateiz/py-version + [Clarify that Python 2.7 is only needed for MLlib] + + e3fa36f Wed Jan 15 13:56:04 2014 -0800 + Merge pull request #442 from pwendell/standalone + [Workers should use working directory as spark home if it's not specified] + + 29c76d9 Wed Jan 15 13:55:48 2014 -0800 + Merge pull request #443 from tdas/filestream-fix + [Made some classes private[stremaing] and deprecated a method in JavaStreamingContext.] + + aca40aa Wed Jan 15 11:15:47 2014 -0800 + Merge pull request #441 from pwendell/graphx-build + [GraphX shouldn't list Spark as provided.] 
+ + e12c374 Wed Jan 15 10:01:43 2014 -0800 + Merge pull request #433 from markhamstra/debFix + [Updated Debian packaging] + + 2f015c2 Tue Jan 14 23:17:28 2014 -0800 + Merge pull request #436 from ankurdave/VertexId-case + [Rename VertexID -> VertexId in GraphX] + + 2859cab Tue Jan 14 23:08:19 2014 -0800 + Merge pull request #435 from tdas/filestream-fix + [Fixed the flaky tests by making SparkConf not serializable] + + fbfbb33 Tue Jan 14 23:06:29 2014 -0800 + Merge pull request #434 from rxin/graphxmaven + [Fixed SVDPlusPlusSuite in Maven build.] + + 2c6c07f Tue Jan 14 21:53:05 2014 -0800 + Merge pull request #424 from jegonzal/GraphXProgrammingGuide + [Additional edits for clarity in the graphx programming guide.] + + 6fa4e02 Tue Jan 14 21:51:25 2014 -0800 + Merge pull request #431 from ankurdave/graphx-caching-doc + [Describe caching and uncaching in GraphX programming guide] + + 2f930d5 Tue Jan 14 15:00:11 2014 -0800 + Merge pull request #428 from pwendell/writeable-objects + [Don't clone records for text files] + + 329c9df Tue Jan 14 14:53:36 2014 -0800 + Merge pull request #429 from ankurdave/graphx-examples-pom.xml + [Add GraphX dependency to examples/pom.xml] + + a14933d Tue Jan 14 14:52:42 2014 -0800 + Merge pull request #427 from pwendell/deprecate-aggregator + [Deprecate rather than remove old combineValuesByKey function] + + 119b6c5 Tue Jan 14 13:29:08 2014 -0800 + Merge pull request #425 from rxin/scaladoc + [API doc update & make Broadcast public] + + bf3b150 Tue Jan 14 09:45:22 2014 -0800 + Merge pull request #423 from jegonzal/GraphXProgrammingGuide + [Improving the graphx-programming-guide] + + 1b4adc2 Tue Jan 14 01:19:24 2014 -0800 + Merge pull request #420 from pwendell/header-files + [Add missing header files] + + b60840e Tue Jan 14 00:48:34 2014 -0800 + Merge pull request #418 from pwendell/0.9-versions + [Version changes for release 0.9.0.] 
+ + 980250b Tue Jan 14 00:05:37 2014 -0800 + Merge pull request #416 from tdas/filestream-fix + [Removed unnecessary DStream operations and updated docs] + + 055be5c Mon Jan 13 23:26:44 2014 -0800 + Merge pull request #415 from pwendell/shuffle-compress + [Enable compression by default for spills] + + fdaabdc Mon Jan 13 23:08:26 2014 -0800 + Merge pull request #380 from mateiz/py-bayes + [Add Naive Bayes to Python MLlib, and some API fixes] + + 4a805af Mon Jan 13 22:58:38 2014 -0800 + Merge pull request #367 from ankurdave/graphx + [GraphX: Unifying Graphs and Tables] + + 945fe7a Mon Jan 13 22:56:12 2014 -0800 + Merge pull request #408 from pwendell/external-serializers + [Improvements to external sorting] + + 68641bc Mon Jan 13 22:54:13 2014 -0800 + Merge pull request #413 from rxin/scaladoc + [Adjusted visibility of various components and documentation for 0.9.0 release.] + + 0ca0d4d Mon Jan 13 22:32:21 2014 -0800 + Merge pull request #401 from andrewor14/master + [External sorting - Add number of bytes spilled to Web UI] + + 08b9fec Mon Jan 13 22:29:03 2014 -0800 + Merge pull request #409 from tdas/unpersist + [Automatically unpersisting RDDs that have been cleaned up from DStreams] + + b07bc02 Mon Jan 13 20:45:22 2014 -0800 + Merge pull request #412 from harveyfeng/master + [Add default value for HadoopRDD's `cloneRecords` constructor arg] + + a2fee38 Mon Jan 13 19:45:26 2014 -0800 + Merge pull request #411 from tdas/filestream-fix + [Improved logic of finding new files in FileInputDStream] + + 01c0d72 Mon Jan 13 16:24:30 2014 -0800 + Merge pull request #410 from rxin/scaladoc1 + [Updated JavaStreamingContext to make scaladoc compile.] + + 8038da2 Mon Jan 13 14:59:30 2014 -0800 + Merge pull request #2 from jegonzal/GraphXCCIssue + [Improving documentation and identifying potential bug in CC calculation.] 
+ + b93f9d4 Mon Jan 13 12:18:05 2014 -0800 + Merge pull request #400 from tdas/dstream-move + [Moved DStream and PairDSream to org.apache.spark.streaming.dstream] + + e6ed13f Sun Jan 12 22:35:14 2014 -0800 + Merge pull request #397 from pwendell/host-port + [Remove now un-needed hostPort option] + + 0b96d85 Sun Jan 12 21:31:43 2014 -0800 + Merge pull request #399 from pwendell/consolidate-off + [Disable shuffle file consolidation by default] + + 0ab505a Sun Jan 12 21:31:04 2014 -0800 + Merge pull request #395 from hsaputra/remove_simpleredundantreturn_scala + [Remove simple redundant return statements for Scala methods/functions] + + 405bfe8 Sun Jan 12 20:04:21 2014 -0800 + Merge pull request #394 from tdas/error-handling + [Better error handling in Spark Streaming and more API cleanup] + + 28a6b0c Sun Jan 12 19:49:36 2014 -0800 + Merge pull request #398 from pwendell/streaming-api + [Rename DStream.foreach to DStream.foreachRDD] + + 074f502 Sun Jan 12 17:01:13 2014 -0800 + Merge pull request #396 from pwendell/executor-env + [Setting load defaults to true in executor] + + 82e2b92 Sun Jan 12 16:55:11 2014 -0800 + Merge pull request #392 from rxin/listenerbus + [Stop SparkListenerBus daemon thread when DAGScheduler is stopped.] + + 288a878 Sat Jan 11 21:53:19 2014 -0800 + Merge pull request #389 from rxin/clone-writables + [Minor update for clone writables and more documentation.] + + dbc11df Sat Jan 11 18:07:13 2014 -0800 + Merge pull request #388 from pwendell/master + [Fix UI bug introduced in #244.] + + 409866b Sat Jan 11 17:12:06 2014 -0800 + Merge pull request #393 from pwendell/revert-381 + [Revert PR 381] + + 6510f04 Sat Jan 11 12:48:26 2014 -0800 + Merge pull request #387 from jerryshao/conf-fix + [Fix configure didn't work small problem in ALS] + + ee6e7f9 Sat Jan 11 12:07:55 2014 -0800 + Merge pull request #359 from ScrapCodes/clone-writables + [We clone hadoop key and values by default and reuse objects if asked to.] 
+ + 4216178 Sat Jan 11 09:46:48 2014 -0800 + Merge pull request #373 from jerryshao/kafka-upgrade + [Upgrade Kafka dependecy to 0.8.0 release version] + + 92ad18b Fri Jan 10 23:25:15 2014 -0800 + Merge pull request #376 from prabeesh/master + [Change clientId to random clientId] + + 0b5ce7a Fri Jan 10 23:23:21 2014 -0800 + Merge pull request #386 from pwendell/typo-fix + [Small typo fix] + + 1d7bef0 Fri Jan 10 18:53:03 2014 -0800 + Merge pull request #381 from mateiz/default-ttl + [Fix default TTL for metadata cleaner] + + 44d6a8e Fri Jan 10 17:51:50 2014 -0800 + Merge pull request #382 from RongGu/master + [Fix a type error in comment lines] + + 88faa30 Fri Jan 10 17:14:22 2014 -0800 + Merge pull request #385 from shivaram/add-i2-instances + [Add i2 instance types to Spark EC2.] + + f265531 Fri Jan 10 16:25:44 2014 -0800 + Merge pull request #383 from tdas/driver-test + [API for automatic driver recovery for streaming programs and other bug fixes] + + d37408f Fri Jan 10 16:25:01 2014 -0800 + Merge pull request #377 from andrewor14/master + [External Sorting for Aggregator and CoGroupedRDDs (Revisited)] + + 0eaf01c Fri Jan 10 15:32:19 2014 -0800 + Merge pull request #369 from pillis/master + [SPARK-961 Add a Vector.random() method] + + 7cef843 Fri Jan 10 15:34:15 2014 -0600 + Merge pull request #371 from tgravescs/yarn_client_addjar_misc_fixes + [Yarn client addjar and misc fixes] + + 7b58f11 Fri Jan 10 12:47:46 2014 -0800 + Merge pull request #384 from pwendell/debug-logs + [Make DEBUG-level logs consummable.] + + 23d2995 Fri Jan 10 10:20:02 2014 -0800 + Merge pull request #1 from jegonzal/graphx + [ProgrammingGuide] + + 0ebc973 Thu Jan 9 23:58:49 2014 -0800 + Merge pull request #375 from mateiz/option-fix + [Fix bug added when we changed AppDescription.maxCores to an Option] + + dd03cea Thu Jan 9 23:38:03 2014 -0800 + Merge pull request #378 from pwendell/consolidate_on + [Enable shuffle consolidation by default.] 
+ + 997c830 Thu Jan 9 22:22:20 2014 -0800 + Merge pull request #363 from pwendell/streaming-logs + [Set default logging to WARN for Spark streaming examples.] + + 300eaa9 Thu Jan 9 20:29:51 2014 -0800 + Merge pull request #353 from pwendell/ipython-simplify + [Simplify and fix pyspark script.] + + 4b074fa Thu Jan 9 19:03:55 2014 -0800 + Merge pull request #374 from mateiz/completeness + [Add some missing Java API methods] + + a9d5333 Thu Jan 9 18:46:46 2014 -0800 + Merge pull request #294 from RongGu/master + [Bug fixes for updating the RDD block's memory and disk usage information] + + d86a85e Thu Jan 9 18:37:52 2014 -0800 + Merge pull request #293 from pwendell/standalone-driver + [SPARK-998: Support Launching Driver Inside of Standalone Mode] + + 26cdb5f Thu Jan 9 17:16:34 2014 -0800 + Merge pull request #372 from pwendell/log4j-fix-1 + [Send logs to stderr by default (instead of stdout).] + + 12f414e Thu Jan 9 15:31:30 2014 -0800 + Merge pull request #362 from mateiz/conf-getters + [Use typed getters for configuration settings] + + 365cac9 Thu Jan 9 00:56:16 2014 -0800 + Merge pull request #361 from rxin/clean + [Minor style cleanup. Mostly on indenting & line width changes.] + + 73c724e Thu Jan 9 00:32:19 2014 -0800 + Merge pull request #368 from pwendell/sbt-fix + [Don't delegate to users `sbt`.] + + dceedb4 Wed Jan 8 23:19:28 2014 -0800 + Merge pull request #364 from pwendell/fix + [Fixing config option "retained_stages" => "retainedStages".] 
+ + 04d83fc Wed Jan 8 11:55:37 2014 -0800 + Merge pull request #360 from witgo/master + [fix make-distribution.sh show version: command not found] + + 56ebfea Wed Jan 8 11:50:06 2014 -0800 + Merge pull request #357 from hsaputra/set_boolean_paramname + [Set boolean param name for call to SparkHadoopMapReduceUtil.newTaskAttemptID] + + bdeaeaf Wed Jan 8 11:48:39 2014 -0800 + Merge pull request #358 from pwendell/add-cdh + [Add CDH Repository to Maven Build] + + 5cae05f Wed Jan 8 11:47:28 2014 -0800 + Merge pull request #356 from hsaputra/remove_deprecated_cleanup_method + [Remove calls to deprecated mapred's OutputCommitter.cleanupJob] + + 6eef78d Wed Jan 8 08:49:20 2014 -0600 + Merge pull request #345 from colorant/yarn + [support distributing extra files to worker for yarn client mode] + + bb6a39a Tue Jan 7 22:32:18 2014 -0800 + Merge pull request #322 from falaki/MLLibDocumentationImprovement + [SPARK-1009 Updated MLlib docs to show how to use it in Python] + + cb1b927 Tue Jan 7 22:26:28 2014 -0800 + Merge pull request #355 from ScrapCodes/patch-1 + [Update README.md] + + c0f0155 Tue Jan 7 22:21:52 2014 -0800 + Merge pull request #313 from tdas/project-refactor + [Refactored the streaming project to separate external libraries like Twitter, Kafka, Flume, etc.] + + f5f12dc Tue Jan 7 21:56:35 2014 -0800 + Merge pull request #336 from liancheng/akka-remote-lookup + [Get rid of `Either[ActorRef, ActorSelection]'] + + 11891e6 Wed Jan 8 00:32:18 2014 -0500 + Merge pull request #327 from lucarosellini/master + [Added ‘-i’ command line option to Spark REPL] + + 7d0aac9 Wed Jan 8 00:30:45 2014 -0500 + Merge pull request #354 from hsaputra/addasfheadertosbt + [Add ASF header to the new sbt script.] 
+ + d75dc42 Wed Jan 8 00:30:03 2014 -0500 + Merge pull request #350 from mateiz/standalone-limit + [Add way to limit default # of cores used by apps in standalone mode] + + 61674bc Tue Jan 7 18:32:13 2014 -0800 + Merge pull request #352 from markhamstra/oldArch + [Don't leave os.arch unset after BlockManagerSuite] + + b2e690f Tue Jan 7 16:57:08 2014 -0800 + Merge pull request #328 from falaki/MatrixFactorizationModel-fix + [SPARK-1012: DAGScheduler Exception Fix] + + 6ccf8ce Tue Jan 7 15:49:14 2014 -0800 + Merge pull request #351 from pwendell/maven-fix + [Add log4j exclusion rule to maven.] + + 7d5fa17 Tue Jan 7 11:31:34 2014 -0800 + Merge pull request #337 from yinxusen/mllib-16-bugfix + [Mllib 16 bugfix] + + 71fc113 Tue Jan 7 11:30:35 2014 -0800 + Merge pull request #349 from CodingCat/support-worker_dir + [add the comments about SPARK_WORKER_DIR] + + 15d9534 Tue Jan 7 08:10:02 2014 -0800 + Merge pull request #318 from srowen/master + [Suggested small changes to Java code for slightly more standard style, encapsulation and in some cases performance] + + 468af0f Tue Jan 7 08:09:01 2014 -0800 + Merge pull request #348 from prabeesh/master + [spark -> org.apache.spark] + + c3cf047 Tue Jan 7 00:54:25 2014 -0800 + Merge pull request #339 from ScrapCodes/conf-improvements + [Conf improvements] + + a862caf Tue Jan 7 00:18:20 2014 -0800 + Merge pull request #331 from holdenk/master + [Add a script to download sbt if not present on the system] + + b97ef21 Mon Jan 6 20:12:57 2014 -0800 + Merge pull request #346 from sproblvem/patch-1 + [Update stop-slaves.sh] + + 7210257 Mon Jan 6 18:25:44 2014 -0800 + Merge pull request #128 from adamnovak/master + [Fix failing "sbt/sbt publish-local" by adding a no-argument PrimitiveKeyOpenHashMap constructor ] + + e4d6057 Mon Jan 6 14:56:54 2014 -0800 + Merge pull request #343 from pwendell/build-fix + [Fix test breaking downstream builds] + + 93bf962 Mon Jan 6 11:42:41 2014 -0800 + Merge pull request #340 from ScrapCodes/sbt-fixes + 
[Made java options to be applied during tests so that they become self explanatory.] + + 60edeb3 Mon Jan 6 11:40:32 2014 -0800 + Merge pull request #338 from ScrapCodes/ning-upgrade + [SPARK-1005 Ning upgrade] + + c708e81 Mon Jan 6 11:35:48 2014 -0800 + Merge pull request #341 from ash211/patch-5 + [Clarify spark.cores.max in docs] + + 33fcb91 Mon Jan 6 11:19:23 2014 -0800 + Merge pull request #342 from tgravescs/fix_maven_protobuf + [Change protobuf version for yarn alpha back to 2.4.1] + + 357083c Mon Jan 6 10:29:04 2014 -0800 + Merge pull request #330 from tgravescs/fix_addjars_null_handling + [Fix handling of empty SPARK_EXAMPLES_JAR] + + a2e7e04 Sun Jan 5 22:37:36 2014 -0800 + Merge pull request #333 from pwendell/logging-silence + [Quiet ERROR-level Akka Logs] + + 5b0986a Sun Jan 5 19:25:09 2014 -0800 + Merge pull request #334 from pwendell/examples-fix + [Removing SPARK_EXAMPLES_JAR in the code] + + f4b924f Sun Jan 5 17:11:47 2014 -0800 + Merge pull request #335 from rxin/ser + [Fall back to zero-arg constructor for Serializer initialization if there is no constructor that accepts SparkConf.] 
+ + d43ad3e Sat Jan 4 16:29:30 2014 -0800 + Merge pull request #292 from soulmachine/naive-bayes + [standard Naive Bayes classifier] + + 86404da Sat Jan 4 14:55:54 2014 -0800 + Merge pull request #127 from jegonzal/MapByPartition + [Adding mapEdges and mapTriplets by Partition] + + e68cdb1 Sat Jan 4 13:46:02 2014 -0800 + Merge pull request #124 from jianpingjwang/master + [refactor and bug fix] + + 280ddf6 Sat Jan 4 12:54:41 2014 -0800 + Merge pull request #121 from ankurdave/more-simplify + [Simplify GraphImpl internals further] + + 10fe23b Fri Jan 3 23:50:14 2014 -0800 + Merge pull request #329 from pwendell/remove-binaries + [SPARK-1002: Remove Binaries from Spark Source] + + c4d6145 Fri Jan 3 16:30:53 2014 -0800 + Merge pull request #325 from witgo/master + [Modify spark on yarn to create SparkConf process] + + 4ae101f Fri Jan 3 11:24:35 2014 -0800 + Merge pull request #317 from ScrapCodes/spark-915-segregate-scripts + [Spark-915 segregate scripts] + + 87248bd Fri Jan 3 00:45:31 2014 -0800 + Merge pull request #1 from apache/master + [Merge latest Spark changes] + + 30b9db0 Thu Jan 2 23:15:55 2014 -0800 + Merge pull request #285 from colorant/yarn-refactor + [Yarn refactor] + + 498a5f0 Thu Jan 2 19:06:40 2014 -0800 + Merge pull request #323 from tgravescs/sparkconf_yarn_fix + [fix spark on yarn after the sparkConf changes] + + 0475ca8 Thu Jan 2 15:17:08 2014 -0800 + Merge pull request #320 from kayousterhout/erroneous_failed_msg + [Remove erroneous FAILED state for killed tasks.] + + 588a169 Thu Jan 2 13:20:54 2014 -0800 + Merge pull request #297 from tdas/window-improvement + [Improvements to DStream window ops and refactoring of Spark's CheckpointSuite] + + 5e67cdc Thu Jan 2 12:56:28 2014 -0800 + Merge pull request #319 from kayousterhout/remove_error_method + [Removed redundant TaskSetManager.error() function.] 
+ + ca67909 Thu Jan 2 15:54:54 2014 -0500 + Merge pull request #311 from tmyklebu/master + [SPARK-991: Report information gleaned from a Python stacktrace in the UI] + + 3713f81 Wed Jan 1 21:29:12 2014 -0800 + Merge pull request #309 from mateiz/conf2 + [SPARK-544. Migrate configuration to a SparkConf class] + + c1d928a Wed Jan 1 17:03:48 2014 -0800 + Merge pull request #312 from pwendell/log4j-fix-2 + [SPARK-1008: Logging improvments] + + dc9cb83 Wed Jan 1 13:28:34 2014 -0800 + Merge pull request #126 from jegonzal/FixingPersist + [Fixing Persist Behavior] + + 9a0ff72 Tue Dec 31 21:50:24 2013 -0800 + Merge pull request #314 from witgo/master + [restore core/pom.xml file modification] + + 8b8e70e Tue Dec 31 17:48:24 2013 -0800 + Merge pull request #73 from falaki/ApproximateDistinctCount + [Approximate distinct count] + + 63b411d Tue Dec 31 14:31:28 2013 -0800 + Merge pull request #238 from ngbinh/upgradeNetty + [upgrade Netty from 4.0.0.Beta2 to 4.0.13.Final] + + 32d6ae9 Tue Dec 31 13:51:07 2013 -0800 + Merge pull request #120 from ankurdave/subgraph-reuses-view + [Reuse VTableReplicated in GraphImpl.subgraph] + + 55b7e2f Tue Dec 31 10:12:51 2013 -0800 + Merge pull request #289 from tdas/filestream-fix + [Bug fixes for file input stream and checkpointing] + + 2b71ab9 Mon Dec 30 11:01:30 2013 -0800 + Merge pull request from aarondav: Utilize DiskBlockManager pathway for temp file writing + [This gives us a couple advantages:] + + 50e3b8e Mon Dec 30 07:44:26 2013 -0800 + Merge pull request #308 from kayousterhout/stage_naming + [Changed naming of StageCompleted event to be consistent] + + 72a17b6 Sat Dec 28 21:25:40 2013 -1000 + Revert "Merge pull request #310 from jyunfan/master" + [This reverts commit 79b20e4dbe3dcd8559ec8316784d3334bb55868b, reversing] + + 79b20e4 Sat Dec 28 21:13:36 2013 -1000 + Merge pull request #310 from jyunfan/master + [Fix typo in the Accumulators section] + + 7375047 Sat Dec 28 13:25:06 2013 -0800 + Merge pull request #304 from 
kayousterhout/remove_unused + [Removed unused failed and causeOfFailure variables (in TaskSetManager)] + + ad3dfd1 Fri Dec 27 22:10:14 2013 -0500 + Merge pull request #307 from kayousterhout/other_failure + [Removed unused OtherFailure TaskEndReason.] + + b579b83 Fri Dec 27 22:09:04 2013 -0500 + Merge pull request #306 from kayousterhout/remove_pending + [Remove unused hasPendingTasks methods] + + 19672dc Fri Dec 27 13:37:10 2013 -0800 + Merge pull request #305 from kayousterhout/line_spacing + [Fixed >100char lines in DAGScheduler.scala] + + 7be1e57 Thu Dec 26 23:41:40 2013 -1000 + Merge pull request #298 from aarondav/minor + [Minor: Decrease margin of left side of Log page] + + 7d811ba Thu Dec 26 23:39:58 2013 -1000 + Merge pull request #302 from pwendell/SPARK-1007 + [SPARK-1007: spark-class2.cmd should change SCALA_VERSION to be 2.10] + + 5e69fc5 Thu Dec 26 19:10:39 2013 -0500 + Merge pull request #295 from markhamstra/JobProgressListenerNPE + [Avoid a lump of coal (NPE) in JobProgressListener's stocking.] + + da20270 Thu Dec 26 12:11:52 2013 -0800 + Merge pull request #1 from aarondav/driver + [Refactor DriverClient to be more Actor-based] + + e240bad Thu Dec 26 12:30:48 2013 -0500 + Merge pull request #296 from witgo/master + [Renamed ClusterScheduler to TaskSchedulerImpl for yarn and new-yarn package] + + c344ed0 Thu Dec 26 01:31:06 2013 -0500 + Merge pull request #283 from tmyklebu/master + [Python bindings for mllib] + + 56094bc Wed Dec 25 13:14:33 2013 -0500 + Merge pull request #290 from ash211/patch-3 + [Typo: avaiable -> available] + + 4842a07 Wed Dec 25 01:52:15 2013 -0800 + Merge pull request #287 from azuryyu/master + [Fixed job name in the java streaming example.] + + 85a344b Tue Dec 24 16:35:06 2013 -0800 + Merge pull request #127 from kayousterhout/consolidate_schedulers + [Deduplicate Local and Cluster schedulers.] 
+ + c2dd6bc Tue Dec 24 14:36:47 2013 -0800 + Merge pull request #279 from aarondav/shuffle-cleanup0 + [Clean up shuffle files once their metadata is gone] + + 3bf7c70 Tue Dec 24 16:37:13 2013 -0500 + Merge pull request #275 from ueshin/wip/changeclasspathorder + [Change the order of CLASSPATH.] + + d63856c Mon Dec 23 22:07:26 2013 -0800 + Merge pull request #286 from rxin/build + [Show full stack trace and time taken in unit tests.] + + 23a9ae6 Tue Dec 24 00:08:48 2013 -0500 + Merge pull request #277 from tdas/scheduler-update + [Refactored the streaming scheduler and added StreamingListener interface] + + 11107c9 Mon Dec 23 10:38:20 2013 -0800 + Merge pull request #244 from leftnoteasy/master + [Added SPARK-968 implementation for review] + + 44e4205 Sun Dec 22 11:44:18 2013 -0800 + Merge pull request #116 from jianpingjwang/master + [remove unused variables and fix a bug] + + 4797c22 Fri Dec 20 13:30:39 2013 -0800 + Merge pull request #118 from ankurdave/VertexPartitionSuite + [Test VertexPartition and fix bugs] + + 0bc57c5 Fri Dec 20 11:56:54 2013 -0800 + Merge pull request #280 from aarondav/minor + [Minor cleanup for standalone scheduler] + + ac70b8f Fri Dec 20 10:56:10 2013 -0800 + Merge pull request #117 from ankurdave/more-tests + [More tests] + + 45310d4 Thu Dec 19 22:08:20 2013 -0800 + Merge pull request #115 from ankurdave/test-reorg + [Reorganize unit tests; improve GraphSuite test coverage] + + 9228ec8 Thu Dec 19 21:37:15 2013 -0800 + Merge pull request #1 from aarondav/127 + [Merge master into 127] + + eca68d4 Thu Dec 19 18:12:22 2013 -0800 + Merge pull request #272 from tmyklebu/master + [Track and report task result serialisation time.] + + 7990c56 Thu Dec 19 13:35:09 2013 -0800 + Merge pull request #276 from shivaram/collectPartition + [Add collectPartition to JavaRDD interface.] 
+ + 440e531 Thu Dec 19 10:38:56 2013 -0800 + Merge pull request #278 from MLnick/java-python-tostring + [Add toString to Java RDD, and __repr__ to Python RDD] + + d8d3f3e Thu Dec 19 00:06:43 2013 -0800 + Merge pull request #183 from aarondav/spark-959 + [[SPARK-959] Explicitly depend on org.eclipse.jetty.orbit jar] + + bfba532 Wed Dec 18 22:22:21 2013 -0800 + Merge pull request #247 from aarondav/minor + [Increase spark.akka.askTimeout default to 30 seconds] + + da301b5 Wed Dec 18 20:03:29 2013 -0800 + Merge pull request #112 from amatsukawa/scc + [Strongly connected component algorithm] + + c64a53a Wed Dec 18 16:56:26 2013 -0800 + Merge pull request #267 from JoshRosen/cygwin + [Fix Cygwin support in several scripts.] + + a645ef6 Wed Dec 18 16:07:52 2013 -0800 + Merge pull request #48 from amatsukawa/add_project_to_graph + [Add mask operation on graph and filter graph primitive] + + d7ebff0 Wed Dec 18 15:38:48 2013 -0800 + Merge pull request #1 from ankurdave/add_project_to_graph + [Merge current master and reimplement Graph.mask using innerJoin] + + 5ea1872 Wed Dec 18 15:27:24 2013 -0800 + Merge pull request #274 from azuryy/master + [Fixed the example link in the Scala programing guid.] + + 3fd2e09 Wed Dec 18 12:52:36 2013 -0800 + Merge pull request #104 from jianpingjwang/master + [SVD++ demo] + + f4effb3 Tue Dec 17 22:26:21 2013 -0800 + Merge pull request #273 from rxin/top + [Fixed a performance problem in RDD.top and BoundedPriorityQueue] + + 1b5eacb Tue Dec 17 13:49:17 2013 -0800 + Merge pull request #102 from ankurdave/clustered-edge-index + [Add clustered index on edges by source vertex] + + 7a8169b Mon Dec 16 22:42:21 2013 -0800 + Merge pull request #268 from pwendell/shaded-protobuf + [Add support for 2.2. 
to master (via shaded jars)] + + 0476c84 Mon Dec 16 17:19:25 2013 -0800 + Merge pull request #100 from ankurdave/mrTriplets-active-set + [Support activeSet option in mapReduceTriplets] + + 964a3b6 Mon Dec 16 15:23:51 2013 -0800 + Merge pull request #270 from ewencp/really-force-ssh-pseudo-tty-master + [Force pseudo-tty allocation in spark-ec2 script.] + + 5192ef3 Mon Dec 16 15:08:08 2013 -0800 + Merge pull request #94 from ankurdave/load-edges-columnar + [Load edges in columnar format] + + 883e034 Mon Dec 16 14:16:02 2013 -0800 + Merge pull request #245 from gregakespret/task-maxfailures-fix + [Fix for spark.task.maxFailures not enforced correctly.] + + a51f340 Sun Dec 15 22:02:30 2013 -0800 + Merge pull request #265 from markhamstra/scala.binary.version + [DRY out the POMs with scala.binary.version] + + ded10ce Sun Dec 15 17:25:33 2013 -0800 + Merge pull request #103 from amplab/optimizations + [Optimizations cherry-picked from SIGMOD branches] + + d2ced6d Sun Dec 15 14:11:34 2013 -0800 + Merge pull request #256 from MLnick/master + [Fix 'IPYTHON=1 ./pyspark' throwing ValueError] + + c55e698 Sun Dec 15 12:49:02 2013 -0800 + Merge pull request #257 from tgravescs/sparkYarnFixName + [Fix the --name option for Spark on Yarn] + + ab85f88 Sun Dec 15 12:48:32 2013 -0800 + Merge pull request #264 from shivaram/spark-class-fix + [Use CoarseGrainedExecutorBackend in spark-class] + + 8a56c1f Sat Dec 14 16:29:24 2013 -0800 + Merge pull request #84 from amatsukawa/graphlab_enhancements + [GraphLab bug fix & set start vertex] + + 7db9165 Sat Dec 14 14:16:34 2013 -0800 + Merge pull request #251 from pwendell/master + [Fix list rendering in YARN markdown docs.] 
+ + 2fd781d Sat Dec 14 12:59:37 2013 -0800 + Merge pull request #249 from ngbinh/partitionInJavaSortByKey + [Expose numPartitions parameter in JavaPairRDD.sortByKey()] + + 9bf192b Sat Dec 14 12:52:18 2013 -0800 + Merge pull request #91 from amplab/standalone-pagerank + [Standalone PageRank] + + 840af5e Sat Dec 14 12:51:51 2013 -0800 + Merge pull request #99 from ankurdave/only-dynamic-pregel + [Remove static Pregel; take maxIterations in dynamic Pregel] + + 97ac060 Sat Dec 14 00:22:45 2013 -0800 + Merge pull request #259 from pwendell/scala-2.10 + [Migration to Scala 2.10] + + 7ac944f Fri Dec 13 23:22:08 2013 -0800 + Merge pull request #262 from pwendell/mvn-fix + [Fix maven build issues in 2.10 branch] + + 6defb06 Fri Dec 13 21:18:57 2013 -0800 + Merge pull request #261 from ScrapCodes/scala-2.10 + [Added a comment about ActorRef and ActorSelection difference.] + + 76566b1 Fri Dec 13 10:11:02 2013 -0800 + Merge pull request #260 from ScrapCodes/scala-2.10 + [Review comments on the PR for scala 2.10 migration.] + + 0aeb182 Thu Dec 12 21:14:42 2013 -0800 + Merge pull request #255 from ScrapCodes/scala-2.10 + [Disabled yarn 2.2 in sbt and mvn build and added a message in the sbt build.] + + 2e89398 Wed Dec 11 23:10:53 2013 -0800 + Merge pull request #254 from ScrapCodes/scala-2.10 + [Scala 2.10 migration] + + ce6ca4e Wed Dec 11 22:30:54 2013 -0800 + Merge pull request #97 from dcrankshaw/fix-rddtop + [Added BoundedPriorityQueue kryo registrator. Fixes top issue.] 
+ + d2efe13 Tue Dec 10 13:01:26 2013 -0800 + Merge pull request #250 from pwendell/master + [README incorrectly suggests build sources spark-env.sh] + + 6169fe1 Mon Dec 9 16:51:36 2013 -0800 + Merge pull request #246 from pwendell/master + [Add missing license headers] + + d992ec6 Sun Dec 8 20:49:20 2013 -0800 + Merge pull request #195 from dhardy92/fix_DebScriptPackage + [[Deb] fix package of Spark classes adding org.apache prefix in scripts embeded in .deb] + + 1f4a4bc Sat Dec 7 22:34:34 2013 -0800 + Merge pull request #242 from pwendell/master + [Update broken links and add HDP 2.0 version string] + + 6494d62 Sat Dec 7 11:56:16 2013 -0800 + Merge pull request #240 from pwendell/master + [SPARK-917 Improve API links in nav bar] + + f466f79 Sat Dec 7 11:51:52 2013 -0800 + Merge pull request #239 from aarondav/nit + [Correct spellling error in configuration.md] + + 3abfbfb Sat Dec 7 11:24:19 2013 -0800 + Merge pull request #92 from ankurdave/rdd-names + [Set RDD names for easy debugging] + + 31e8a14 Fri Dec 6 21:49:55 2013 -0800 + Merge pull request #90 from amplab/pregel-replicate-changed + [Replicate only changed vertices] + + 10c3c0c Fri Dec 6 20:29:45 2013 -0800 + Merge pull request #237 from pwendell/formatting-fix + [Formatting fix] + + 1b38f5f Fri Dec 6 20:16:15 2013 -0800 + Merge pull request #236 from pwendell/shuffle-docs + [Adding disclaimer for shuffle file consolidation] + + e5d5728 Fri Dec 6 20:14:56 2013 -0800 + Merge pull request #235 from pwendell/master + [Minor doc fixes and updating README] + + 241336a Fri Dec 6 17:29:03 2013 -0800 + Merge pull request #234 from alig/master + [Updated documentation about the YARN v2.2 build process] + + e039234 Fri Dec 6 11:49:59 2013 -0800 + Merge pull request #190 from markhamstra/Stages4Jobs + [stageId <--> jobId mapping in DAGScheduler] + + bfa6860 Fri Dec 6 11:04:03 2013 -0800 + Merge pull request #233 from hsaputra/changecontexttobackend + [Change the name of input argument in ClusterScheduler#initialize 
from context to backend.] + + 3fb302c Fri Dec 6 11:03:32 2013 -0800 + Merge pull request #205 from kayousterhout/logging + [Added logging of scheduler delays to UI] + + 87676a6 Fri Dec 6 11:01:42 2013 -0800 + Merge pull request #220 from rxin/zippart + [Memoize preferred locations in ZippedPartitionsBaseRDD] + + 0780498 Thu Dec 5 23:29:42 2013 -0800 + Merge pull request #232 from markhamstra/FiniteWait + [jobWaiter.synchronized before jobWaiter.wait] + + 1c8500e Thu Dec 5 16:25:44 2013 -0800 + Merge pull request #88 from amplab/varenc + [Fixed a bug that variable encoding doesn't work for ints that use all 64 bits.] + + e0bcaa0 Thu Dec 5 12:37:02 2013 -0800 + Merge pull request #86 from ankurdave/vid-varenc + [Finish work on #85] + + 5d46025 Thu Dec 5 12:31:24 2013 -0800 + Merge pull request #228 from pwendell/master + [Document missing configs and set shuffle consolidation to false.] + + 3e96b9a Thu Dec 5 12:07:36 2013 -0800 + Merge pull request #85 from ankurdave/vid-varenc + [Always write Vids using variable encoding] + + 72b6961 Wed Dec 4 23:33:04 2013 -0800 + Merge pull request #199 from harveyfeng/yarn-2.2 + [Hadoop 2.2 migration] + + e0347ba Wed Dec 4 17:38:06 2013 -0800 + Merge pull request #83 from ankurdave/fix-tests + [Fix compile errors in GraphSuite and SerializerSuite] + + 182f9ba Wed Dec 4 15:52:07 2013 -0800 + Merge pull request #227 from pwendell/master + [Fix small bug in web UI and minor clean-up.] + + cbd3b75 Wed Dec 4 15:35:26 2013 -0800 + Merge pull request #81 from amplab/clean1 + [Codebase refactoring] + + b9e7609 Wed Dec 4 14:42:09 2013 -0800 + Merge pull request #225 from ash211/patch-3 + [Add missing space after "Serialized" in StorageLevel] + + 055462c Wed Dec 4 14:02:11 2013 -0800 + Merge pull request #226 from ash211/patch-4 + [Typo: applicaton] + + d6e5473 Wed Dec 4 10:28:50 2013 -0800 + Merge pull request #223 from rxin/transient + [Mark partitioner, name, and generator field in RDD as @transient.] 
+ + 8a3475a Tue Dec 3 14:21:40 2013 -0800 + Merge pull request #218 from JoshRosen/spark-970-pyspark-unicode-error + [Fix UnicodeEncodeError in PySpark saveAsTextFile() (SPARK-970)] + + 46b87b8 Tue Dec 3 00:41:11 2013 -0800 + Merge pull request #2 from colorant/yarn-client-2.2 + [Fix pom.xml for maven build] + + 58d9bbc Mon Dec 2 21:58:53 2013 -0800 + Merge pull request #217 from aarondav/mesos-urls + [Re-enable zk:// urls for Mesos SparkContexts] + + 740922f Sun Dec 1 12:46:58 2013 -0800 + Merge pull request #219 from sundeepn/schedulerexception + [Scheduler quits when newStage fails] + + 60e23a5 Sat Nov 30 23:38:49 2013 -0800 + Merge pull request #216 from liancheng/fix-spark-966 + [Bugfix: SPARK-965 & SPARK-966] + + 34ee814 Sat Nov 30 15:10:30 2013 -0800 + Merged Ankur's pull request #80 and fixed subgraph. + [] + + 743a31a Wed Nov 27 18:24:39 2013 -0800 + Merge pull request #210 from haitaoyao/http-timeout + [add http timeout for httpbroadcast] + + 993e293 Wed Nov 27 00:57:54 2013 -0800 + Merge pull request #1 from colorant/yarn-client-2.2 + [Port yarn-client mode for new-yarn] + + fb6875d Tue Nov 26 20:55:40 2013 -0800 + Merge pull request #146 from JoshRosen/pyspark-custom-serializers + [Custom Serializers for PySpark] + + 330ada1 Tue Nov 26 19:08:33 2013 -0800 + Merge pull request #207 from henrydavidge/master + [Log a warning if a task's serialized size is very big] + + 615213f Tue Nov 26 19:07:20 2013 -0800 + Merge pull request #212 from markhamstra/SPARK-963 + [[SPARK-963] Fixed races in JobLoggerSuite] + + cb976df Tue Nov 26 10:23:19 2013 -0800 + Merge pull request #209 from pwendell/better-docs + [Improve docs for shuffle instrumentation] + + 18d6df0 Tue Nov 26 00:00:07 2013 -0800 + Merge pull request #86 from holdenk/master + [Add histogram functionality to DoubleRDDFunctions] + + 0e2109d Mon Nov 25 20:48:37 2013 -0800 + Merge pull request #204 from rxin/hash + [OpenHashSet fixes] + + c46067f Mon Nov 25 19:09:31 2013 -0800 + Merge pull request #206 
from ash211/patch-2 + [Update tuning.md] + + 14bb465 Mon Nov 25 18:50:18 2013 -0800 + Merge pull request #201 from rxin/mappartitions + [Use the proper partition index in mapPartitionsWithIndex] + + eb4296c Mon Nov 25 15:25:29 2013 -0800 + Merge pull request #101 from colorant/yarn-client-scheduler + [For SPARK-527, Support spark-shell when running on YARN] + + 466fd06 Mon Nov 25 18:27:26 2013 +0800 + Incorporated ideas from pull request #200. - Use Murmur Hash 3 finalization step to scramble the bits of HashCode instead of the simpler version in java.util.HashMap; the latter one had trouble with ranges of consecutive integers. Murmur Hash 3 is used by fastutil. + [- Don't check keys for equality when re-inserting due to growing the] + + 088995f Mon Nov 25 00:57:51 2013 -0800 + Merge pull request #77 from amplab/upgrade + [Sync with Spark master] + + 62889c4 Mon Nov 25 11:27:45 2013 +0800 + Merge pull request #203 from witgo/master + [ Fix Maven build for metrics-graphite] + + 6af03ed Sun Nov 24 16:42:37 2013 -0800 + Merge pull request #76 from dcrankshaw/fix_partitioners + [Actually use partitioner command line args in Analytics.] 
+ + 859d62d Sun Nov 24 16:19:51 2013 -0800 + Merge pull request #151 from russellcardullo/add-graphite-sink + [Add graphite sink for metrics] + + 65de73c Sun Nov 24 15:52:33 2013 -0800 + Merge pull request #185 from mkolod/random-number-generator + [XORShift RNG with unit tests and benchmark] + + 972171b Mon Nov 25 07:50:46 2013 +0800 + Merge pull request #197 from aarondav/patrick-fix + [Fix 'timeWriting' stat for shuffle files] + + a1a7e36 Sun Nov 24 05:15:09 2013 -0800 + Merge pull request #75 from amplab/simplify + [Simplify GraphImpl internals] + + 718cc80 Sun Nov 24 11:02:02 2013 +0800 + Merge pull request #200 from mateiz/hash-fix + [AppendOnlyMap fixes] + + 51aa9d6 Sat Nov 23 19:46:46 2013 +0800 + Merge pull request #198 from ankurdave/zipPartitions-preservesPartitioning + [Support preservesPartitioning in RDD.zipPartitions] + + 18ce7e9 Fri Nov 22 17:02:40 2013 -0800 + Merge pull request #73 from jegonzal/TriangleCount + [Triangle count] + + 086b097 Fri Nov 22 10:26:39 2013 +0800 + Merge pull request #193 from aoiwelle/patch-1 + [Fix Kryo Serializer buffer documentation inconsistency] + + f20093c Fri Nov 22 10:12:13 2013 +0800 + Merge pull request #196 from pwendell/master + [TimeTrackingOutputStream should pass on calls to close() and flush().] 
+ + 4b89501 Wed Nov 20 10:36:10 2013 -0800 + Merge pull request #191 from hsaputra/removesemicolonscala + [Cleanup to remove semicolons (;) from Scala code] + + 202f8e6 Wed Nov 20 03:26:08 2013 -0800 + Merge pull request #74 from dcrankshaw/remove_sleep + [Removed sleep from pagerank in Analytics] + + 74ade9e Tue Nov 19 16:53:58 2013 -0800 + Merge pull request #62 from dcrankshaw/partitioners + [Allow user to choose a partitioner at runtime] + + f568912 Tue Nov 19 16:11:31 2013 -0800 + Merge pull request #181 from BlackNiuza/fix_tasks_number + [correct number of tasks in ExecutorsUI] + + aa638ed Tue Nov 19 16:05:44 2013 -0800 + Merge pull request #189 from tgravescs/sparkYarnErrorHandling + [Improve Spark on Yarn Error handling] + + 5592580 Tue Nov 19 16:04:01 2013 -0800 + Merge pull request #187 from aarondav/example-bcast-test + [Enable the Broadcast examples to work in a cluster setting] + + 99cfe89 Mon Nov 18 22:00:36 2013 -0500 + Updates to reflect pull request code review + [] + + e2ebc3a Sun Nov 17 18:42:18 2013 -0800 + Merge pull request #182 from rxin/vector + [Slightly enhanced PrimitiveVector:] + + 26f616d Sun Nov 17 18:18:16 2013 -0800 + Merge pull request #3 from aarondav/pv-test + [Add PrimitiveVectorSuite and fix bug in resize()] + + 1b5b358 Sat Nov 16 11:44:10 2013 -0800 + Merge pull request #178 from hsaputra/simplecleanupcode + [Simple cleanup on Spark's Scala code] + + 62a2a71 Fri Nov 15 13:12:07 2013 -0800 + Merge pull request #65 from amplab/varenc + [Use variable encoding for ints, longs, and doubles in the specialized serializers.] + + f6b2e59 Thu Nov 14 23:04:55 2013 -0800 + Merge pull request #1 from aarondav/scala210-master + [Various merge corrections] + + 96e0fb4 Thu Nov 14 22:29:28 2013 -0800 + Merge pull request #173 from kayousterhout/scheduler_hang + [Fix bug where scheduler could hang after task failure.] 
+ + dfd40e9 Thu Nov 14 19:44:50 2013 -0800 + Merge pull request #175 from kayousterhout/no_retry_not_serializable + [Don't retry tasks when they fail due to a NotSerializableException] + + ed25105 Thu Nov 14 19:43:55 2013 -0800 + Merge pull request #174 from ahirreddy/master + [Write Spark UI url to driver file on HDFS] + + 1a4cfbe Thu Nov 14 10:32:11 2013 -0800 + Merge pull request #169 from kayousterhout/mesos_fix + [Don't ignore spark.cores.max when using Mesos Coarse mode] + + 5a4f483 Thu Nov 14 10:30:36 2013 -0800 + Merge pull request #170 from liancheng/hadooprdd-doc-typo + [Fixed a scaladoc typo in HadoopRDD.scala] + + d76f520 Thu Nov 14 10:25:48 2013 -0800 + Merge pull request #171 from RIA-pierre-borckmans/master + [Fixed typos in the CDH4 distributions version codes.] + + 2c39d80 Wed Nov 13 23:28:01 2013 -0800 + Merge pull request #69 from jegonzal/MissingVertices + [Addressing issue in Graph creation] + + 33b2dea Wed Nov 13 17:55:58 2013 -0800 + Merge pull request #1 from ankurdave/MissingVertices + [During graph creation, create eTable earlier] + + 2054c61 Wed Nov 13 16:49:55 2013 -0800 + Merge pull request #159 from liancheng/dagscheduler-actor-refine + [Migrate the daemon thread started by DAGScheduler to Akka actor] + + 9290e5b Wed Nov 13 16:48:44 2013 -0800 + Merge pull request #165 from NathanHowell/kerberos-master + [spark-assembly.jar fails to authenticate with YARN ResourceManager] + + a81fcb7 Wed Nov 13 10:41:01 2013 -0800 + Merge pull request #68 from jegonzal/BitSetSetUntilBug + [Addressing bug in BitSet.setUntil(ind)] + + 39af914 Wed Nov 13 08:39:05 2013 -0800 + Merge pull request #166 from ahirreddy/simr-spark-ui + [SIMR Backend Scheduler will now write Spark UI URL to HDFS, which is to ...] + + f49ea28 Tue Nov 12 19:13:39 2013 -0800 + Merge pull request #137 from tgravescs/sparkYarnJarsHdfsRebase + [Allow spark on yarn to be run from HDFS.] 
+ + 87f2f4e Tue Nov 12 16:26:09 2013 -0800 + Merge pull request #153 from ankurdave/stop-spot-cluster + [Enable stopping and starting a spot cluster] + + b8bf04a Tue Nov 12 16:19:50 2013 -0800 + Merge pull request #160 from xiajunluan/JIRA-923 + [Fix bug JIRA-923] + + dfd1ebc Tue Nov 12 09:10:05 2013 -0800 + Merge pull request #164 from tdas/kafka-fix + [Made block generator thread safe to fix Kafka bug.] + + 2e8d450 Mon Nov 11 17:34:09 2013 -0800 + Merge pull request #63 from jegonzal/VertexSetCleanup + [Cleanup of VertexSetRDD] + + b8e294a Mon Nov 11 16:25:42 2013 -0800 + Merge pull request #61 from ankurdave/pid2vid + [Shuffle replicated vertex attributes efficiently in columnar format] + + 3d7277c Mon Nov 11 15:49:28 2013 -0800 + Merge pull request #55 from ankurdave/aggregateNeighbors-variants + [Specialize mapReduceTriplets for accessing subsets of vertex attributes] + + 23b53ef Mon Nov 11 12:30:02 2013 -0800 + Merge pull request #156 from haoyuan/master + [add tachyon module] + + 1a06f70 Sun Nov 10 10:54:44 2013 -0800 + Merge pull request #60 from amplab/rxin + [Looks good to me.] + + 58d4f6c Sun Nov 10 09:23:56 2013 -0800 + Merge pull request #157 from rxin/kryo + [3 Kryo related changes.] + + 3efc019 Sat Nov 9 17:53:49 2013 -0800 + Merge pull request #147 from JoshRosen/fix-java-api-completeness-checker + [Add spark-tools assembly to spark-class's classpath] + + 87954d4 Sat Nov 9 17:53:25 2013 -0800 + Merge pull request #154 from soulmachine/ClusterScheduler + [Replace the thread inside ClusterScheduler.start() with an Akka scheduler] + + f6c9462 Sat Nov 9 16:14:45 2013 -0800 + Merge pull request #58 from jegonzal/KryoMessages + [Kryo messages] + + 83bf192 Sat Nov 9 15:40:29 2013 -0800 + Merge pull request #155 from rxin/jobgroup + [Don't reset job group when a new job description is set.] 
+ + 8af99f2 Sat Nov 9 13:48:00 2013 -0800 + Merge pull request #149 from tgravescs/fixSecureHdfsAccess + [Fix secure hdfs access for spark on yarn] + + 72a601e Sat Nov 9 11:55:16 2013 -0800 + Merge pull request #152 from rxin/repl + [Propagate SparkContext local properties from spark-repl caller thread to the repl execution thread.] + + 6ee05be Thu Nov 7 19:12:41 2013 -0800 + Merge pull request #49 from jegonzal/graphxshell + [GraphX Console with Logo Text] + + a9f96b5 Thu Nov 7 18:56:56 2013 -0800 + Merge pull request #56 from jegonzal/PregelAPIChanges + [Changing Pregel API to use mapReduceTriplets instead of aggregateNeighbors] + + 5907137 Thu Nov 7 16:58:31 2013 -0800 + Merge pull request #54 from amplab/rxin + [Converted for loops to while loops in EdgePartition.] + + edf4164 Thu Nov 7 16:22:43 2013 -0800 + Merge pull request #53 from amplab/rxin + [Added GraphX to classpath.] + + c379e10 Thu Nov 7 16:01:47 2013 -0800 + Merge pull request #51 from jegonzal/VertexSetRDD + [Reverting to Array based (materialized) output in VertexSetRDD] + + 3d4ad84 Thu Nov 7 11:08:27 2013 -0800 + Merge pull request #148 from squito/include_appId + [Include appId in executor cmd line args] + + be7e8da Wed Nov 6 23:22:47 2013 -0800 + Merge pull request #23 from jerryshao/multi-user + [Add Spark multi-user support for standalone mode and Mesos] + + aadeda5 Wed Nov 6 13:27:47 2013 -0800 + Merge pull request #144 from liancheng/runjob-clean + [Removed unused return value in SparkContext.runJob] + + 951024f Wed Nov 6 09:36:14 2013 -0800 + Merge pull request #145 from aarondav/sls-fix + [Attempt to fix SparkListenerSuite breakage] + + bf4e613 Tue Nov 5 23:14:09 2013 -0800 + Merge pull request #143 from rxin/scheduler-hang + [Ignore a task update status if the executor doesn't exist anymore.] 
+ + 9f7b9bb Tue Nov 5 10:42:19 2013 -0800 + Merge pull request #142 from liancheng/dagscheduler-pattern-matching + [Using case class deep match to simplify code in DAGScheduler.processEvent] + + ca44b51 Tue Nov 5 01:32:55 2013 -0800 + Merge pull request #50 from amplab/mergemerge + [Merge Spark master into graphx] + + 8106532 Mon Nov 4 20:47:14 2013 -0800 + Merge pull request #139 from aarondav/shuffle-next + [Never store shuffle blocks in BlockManager] + + 0b26a39 Mon Nov 4 18:22:06 2013 -0800 + Merge pull request #128 from shimingfei/joblogger-doc + [add javadoc to JobLogger, and some small fix] + + 7a26104 Mon Nov 4 17:54:06 2013 -0800 + Merge pull request #130 from aarondav/shuffle + [Memory-optimized shuffle file consolidation] + + b5dc339 Sun Nov 3 20:43:15 2013 -0800 + Merge pull request #70 from rxin/hash1 + [Fast, memory-efficient hash set, hash table implementations optimized for primitive data types.] + + 41ead7a Sat Nov 2 14:41:50 2013 -0700 + Merge pull request #133 from Mistobaan/link_fix + [update default github] + + d407c07 Sat Nov 2 14:36:37 2013 -0700 + Merge pull request #134 from rxin/readme + [Fixed a typo in Hadoop version in README.] 
+ + e7c7b80 Fri Nov 1 17:58:10 2013 -0700 + Merge pull request #132 from Mistobaan/doc_fix + [fix persistent-hdfs] + + d6d11c2 Fri Nov 1 15:40:33 2013 -0700 + Merge pull request #129 from velvia/2013-11/document-local-uris + [Document & finish support for local: URIs] + + 99bfcc9 Thu Oct 31 21:38:10 2013 -0700 + Merge pull request #46 from jegonzal/VertexSetWithHashSet + [Switched VertexSetRDD and GraphImpl to use OpenHashSet] + + fcaaf86 Thu Oct 31 18:27:30 2013 -0700 + Merge pull request #44 from jegonzal/rxinBitSet + [Switching to VertexSetRDD to use @rxin BitSet and OpenHash ] + + 3f3c727 Thu Oct 31 09:52:25 2013 -0700 + Merge pull request #41 from jegonzal/LineageTracking + [Optimizing Graph Lineage] + + 944f6b8 Thu Oct 31 09:40:35 2013 -0700 + Merge pull request #43 from amplab/FixBitSetCastException + [Fix BitSet cast exception] + + 8f1098a Wed Oct 30 20:11:48 2013 -0700 + Merge pull request #117 from stephenh/avoid_concurrent_modification_exception + [Handle ConcurrentModificationExceptions in SparkContext init.] 
+ + dc9ce16 Wed Oct 30 17:01:56 2013 -0700 + Merge pull request #126 from kayousterhout/local_fix + [Fixed incorrect log message in local scheduler] + + 33de11c Wed Oct 30 16:58:27 2013 -0700 + Merge pull request #124 from tgravescs/sparkHadoopUtilFix + [Pull SparkHadoopUtil out of SparkEnv (jira SPARK-886)] + + a0c86c3 Wed Oct 30 15:34:39 2013 -0700 + Merge pull request #38 from jegonzal/Documentation + [Improving Documentation] + + 618c1f6 Wed Oct 30 12:03:44 2013 -0700 + Merge pull request #125 from velvia/2013-10/local-jar-uri + [Add support for local:// URI scheme for addJars()] + + 745dc42 Tue Oct 29 23:47:10 2013 -0700 + Merge pull request #118 from JoshRosen/blockinfo-memory-usage + [Reduce the memory footprint of BlockInfo objects] + + 06adf63 Tue Oct 29 16:43:46 2013 -0700 + Merge pull request #33 from kellrott/master + [Fixing graph/pom.xml] + + 098768e Tue Oct 29 15:08:36 2013 -0700 + Merge pull request #37 from jegonzal/AnalyticsCleanup + [Updated Connected Components and Pregel Docs] + + f0e23a0 Tue Oct 29 01:41:44 2013 -0400 + Merge pull request #119 from soulmachine/master + [A little revise for the document] + + aec9bf9 Sun Oct 27 19:32:00 2013 -0700 + Merge pull request #112 from kayousterhout/ui_task_attempt_id + [Display both task ID and task attempt ID in UI, and rename taskId to taskAttemptId] + + d4df474 Sun Oct 27 22:11:21 2013 -0400 + Merge pull request #115 from aarondav/shuffle-fix + [Eliminate extra memory usage when shuffle file consolidation is disabled] + + e018f2d Sat Oct 26 11:39:15 2013 -0700 + Merge pull request #113 from pwendell/master + [Improve error message when multiple assembly jars are present.] 
+ + 662ee9f Sat Oct 26 11:35:59 2013 -0700 + Merge pull request #114 from soulmachine/master + [A little revise for the document] + + bab496c Fri Oct 25 18:28:43 2013 -0700 + Merge pull request #108 from alig/master + [Changes to enable executing by using HDFS as a synchronization point between driver and executors, as well as ensuring executors exit properly.] + + d307db6 Fri Oct 25 17:26:06 2013 -0700 + Merge pull request #102 from tdas/transform + [Added new Spark Streaming operations] + + 85e2cab Fri Oct 25 14:46:06 2013 -0700 + Merge pull request #111 from kayousterhout/ui_name + [Properly display the name of a stage in the UI.] + + ab35ec4 Fri Oct 25 10:16:18 2013 -0700 + Merge pull request #110 from pwendell/master + [Exclude jopt from kafka dependency.] + + 4f2c943 Thu Oct 24 22:32:02 2013 -0700 + Merge pull request #109 from pwendell/master + [Adding Java/Java Streaming versions of `repartition` with associated tests] + + 99ad4a6 Thu Oct 24 17:08:39 2013 -0700 + Merge pull request #106 from pwendell/master + [Add a `repartition` operator.] + + 5429d62 Thu Oct 24 11:15:55 2013 -0700 + Merge pull request #107 from ScrapCodes/scala-2.10 + [Updating to latest akka 2.2.3, which fixes our only failing test Driver Suite.] + + 6f82c42 Thu Oct 24 11:09:46 2013 -0700 + Merge pull request #34 from jegonzal/AnalyticsCleanup + [Analytics Cleanup] + + 1dc776b Wed Oct 23 22:05:52 2013 -0700 + Merge pull request #93 from kayousterhout/ui_new_state + [Show "GETTING_RESULTS" state in UI.] + + c4b187d Wed Oct 23 21:56:18 2013 -0700 + Merge pull request #105 from pwendell/doc-fix + [Fixing broken links in programming guide] + + a098438 Wed Oct 23 18:03:08 2013 -0700 + Merge pull request #103 from JoshRosen/unpersist-fix + [Add unpersist() to JavaDoubleRDD and JavaPairRDD.] 
+ + dd65964 Wed Oct 23 15:07:59 2013 -0700 + Merge pull request #64 from prabeesh/master + [MQTT Adapter for Spark Streaming] + + 452aa36 Tue Oct 22 23:15:33 2013 -0700 + Merge pull request #97 from ewencp/pyspark-system-properties + [Add classmethod to SparkContext to set system properties.] + + 9dfcf53 Tue Oct 22 16:01:42 2013 -0700 + Merge pull request #100 from JoshRosen/spark-902 + [Remove redundant Java Function call() definitions] + + 49d5cda Tue Oct 22 15:38:02 2013 -0700 + Merge pull request #30 from jegonzal/VertexSetRDD_Tests + [Testing and Documenting VertexSetRDD] + + 97184de Tue Oct 22 13:10:14 2013 -0700 + Merge pull request #99 from pwendell/master + [Use correct formatting for comments in StoragePerfTester] + + c404adb Tue Oct 22 11:30:19 2013 -0700 + Merge pull request #90 from pwendell/master + [SPARK-940: Do not directly pass Stage objects to SparkListener.] + + aa9019f Tue Oct 22 10:30:02 2013 -0700 + Merge pull request #98 from aarondav/docs + [Docs: Fix links to RDD API documentation] + + a0e08f0 Tue Oct 22 10:20:43 2013 -0700 + Merge pull request #82 from JoshRosen/map-output-tracker-refactoring + [Split MapOutputTracker into Master/Worker classes] + + b84193c Mon Oct 21 23:35:13 2013 -0700 + Merge pull request #92 from tgravescs/sparkYarnFixClasspath + [Fix the Worker to use CoarseGrainedExecutorBackend and modify classpath ...] 
+ + 731c94e Mon Oct 21 23:31:38 2013 -0700 + Merge pull request #56 from jerryshao/kafka-0.8-dev + [Upgrade Kafka 0.7.2 to Kafka 0.8.0-beta1 for Spark Streaming] + + 48952d6 Mon Oct 21 22:45:00 2013 -0700 + Merge pull request #87 from aarondav/shuffle-base + [Basic shuffle file consolidation] + + a51359c Mon Oct 21 20:33:29 2013 -0700 + Merge pull request #95 from aarondav/perftest + [Minor: Put StoragePerfTester in org/apache/] + + 39d2e9b Mon Oct 21 18:58:48 2013 -0700 + Merge pull request #94 from aarondav/mesos-fix + [Fix mesos urls] + + aa61bfd Mon Oct 21 11:57:05 2013 -0700 + Merge pull request #88 from rxin/clean + [Made the following traits/interfaces/classes non-public:] + + 35886f3 Sun Oct 20 22:20:32 2013 -0700 + Merge pull request #41 from pwendell/shuffle-benchmark + [Provide Instrumentation for Shuffle Write Performance] + + 5b9380e Sun Oct 20 21:03:51 2013 -0700 + Merge pull request #89 from rxin/executor + [Don't setup the uncaught exception handler in local mode.] + + 261bcf2 Sun Oct 20 17:59:51 2013 -0700 + Merge pull request #80 from rxin/build + [Exclusion rules for Maven build files.] + + edc5e3f Sun Oct 20 17:18:06 2013 -0700 + Merge pull request #75 from JoshRosen/block-manager-cleanup + [Code de-duplication in BlockManager] + + 2a7ae17 Sun Oct 20 11:45:21 2013 -0700 + Merge pull request #84 from rxin/kill1 + [Added documentation for setJobGroup. Also some minor cleanup in SparkContext.] + + e4abb75 Sun Oct 20 09:38:37 2013 -0700 + Merge pull request #85 from rxin/clean + [Moved the top level spark package object from spark to org.apache.spark] + + 136b9b3 Sun Oct 20 02:58:26 2013 -0700 + Basic shuffle file consolidation + [The Spark shuffle phase can produce a large number of files, as one file is created] + + 747f538 Sat Oct 19 23:40:40 2013 -0700 + Merge pull request #83 from ewencp/pyspark-accumulator-add-method + [Add an add() method to pyspark accumulators.] 
+ + 6511bbe Sat Oct 19 11:34:56 2013 -0700 + Merge pull request #78 from mosharaf/master + [Removed BitTorrentBroadcast and TreeBroadcast.] + + f628804 Fri Oct 18 23:19:42 2013 -0700 + Merge pull request #76 from pwendell/master + [Clarify compression property.] + + 599dcb0 Fri Oct 18 22:49:00 2013 -0700 + Merge pull request #74 from rxin/kill + [Job cancellation via job group id.] + + 9cf43cf Fri Oct 18 22:07:21 2013 -0700 + Merge pull request #28 from jegonzal/VertexSetRDD + [Refactoring IndexedRDD to VertexSetRDD.] + + f888a5b Fri Oct 18 22:06:58 2013 -0700 + Merge pull request #29 from ankurdave/unit-tests + [Unit tests for Graph and GraphOps] + + 8de9706 Fri Oct 18 20:32:39 2013 -0700 + Merge pull request #66 from shivaram/sbt-assembly-deps + [Add SBT target to assemble dependencies] + + e5316d0 Fri Oct 18 20:30:56 2013 -0700 + Merge pull request #68 from mosharaf/master + [Faster and stable/reliable broadcast] + + 8d528af Fri Oct 18 20:24:10 2013 -0700 + Merge pull request #71 from aarondav/scdefaults + [Spark shell exits if it cannot create SparkContext] + + 0794bd7 Fri Oct 18 18:59:58 2013 -0700 + Merge pull request #27 from jegonzal/removed_indexedrdd_from_core + [Removing IndexedRDD changes for spark/core] + + 099977f Thu Oct 17 14:17:08 2013 -0700 + Merge pull request #26 from ankurdave/split-vTableReplicated + [Great work!] + + fc26e5b Thu Oct 17 13:21:07 2013 -0700 + Merge pull request #69 from KarthikTunga/master + [Fix for issue SPARK-627. Implementing --config argument in the scripts.] + + cf64f63 Thu Oct 17 11:12:28 2013 -0700 + Merge pull request #67 from kayousterhout/remove_tsl + [Removed TaskSchedulerListener interface.] + + f9973ca Wed Oct 16 15:58:41 2013 -0700 + Merge pull request #65 from tgravescs/fixYarn + [Fix yarn build] + + 28e9c2a Tue Oct 15 23:59:56 2013 -0700 + Merge pull request #63 from pwendell/master + [Fixing spark streaming example and a bug in examples build.] 
+ + 4e46fde Tue Oct 15 23:14:27 2013 -0700 + Merge pull request #62 from harveyfeng/master + [Make TaskContext's stageId publicly accessible.] + + b534606 Tue Oct 15 21:25:03 2013 -0700 + Merge pull request #8 from vchekan/checkpoint-ttl-restore + [Serialize and restore spark.cleaner.ttl to savepoint] + + 6dbd220 Tue Oct 15 19:02:57 2013 -0700 + Merge pull request #34 from kayousterhout/rename + [Renamed StandaloneX to CoarseGrainedX.] + + 983b83f Tue Oct 15 19:02:46 2013 -0700 + Merge pull request #61 from kayousterhout/daemon_thread + [Unified daemon thread pools] + + 3249e0e Tue Oct 15 14:12:33 2013 -0700 + Merge pull request #59 from rxin/warning + [Bump up logging level to warning for failed tasks.] + + 678dec6 Tue Oct 15 10:51:46 2013 -0700 + Merge pull request #58 from hsaputra/update-pom-asf + [Update pom.xml to use version 13 of the ASF parent pom] + + e33b183 Mon Oct 14 22:25:47 2013 -0700 + Merge pull request #29 from rxin/kill + [Job killing] + + 3b11f43 Mon Oct 14 14:20:01 2013 -0700 + Merge pull request #57 from aarondav/bid + [Refactor BlockId into an actual type] + + 9979690 Sat Oct 12 21:23:26 2013 -0700 + Merge pull request #52 from harveyfeng/hadoop-closure + [Add an optional closure parameter to HadoopRDD instantiation to use when creating local JobConfs.] 
+ + dca8009 Fri Oct 11 16:08:15 2013 -0700 + Merge pull request #54 from aoiwelle/remove_unused_imports + [Remove unnecessary mutable imports] + + 0e5052b Fri Oct 11 15:45:16 2013 -0700 + Merge pull request #51 from ScrapCodes/scala-2.10 + [Scala 2.10] + + fb25f32 Fri Oct 11 15:44:43 2013 -0700 + Merge pull request #53 from witgo/master + [Add a zookeeper compile dependency to fix build in maven] + + d6ead47 Fri Oct 11 15:43:01 2013 -0700 + Merge pull request #32 from mridulm/master + [Address review comments, move to incubator spark] + + c71499b Thu Oct 10 17:16:42 2013 -0700 + Merge pull request #19 from aarondav/master-zk + [Standalone Scheduler fault tolerance using ZooKeeper] + + 5867a82 Thu Oct 10 14:02:37 2013 -0700 + Merge pull request #19 from dcrankshaw/master + [Merge canonical 2d partitioner and group edges into benchmarks] + + cd08f73 Thu Oct 10 13:55:47 2013 -0700 + Merge pull request #44 from mateiz/fast-map + [A fast and low-memory append-only map for shuffle operations] + + 4b46d51 Thu Oct 10 13:35:36 2013 -0700 + Merge pull request #17 from amplab/product2 + [product 2 change] + + 320418f Wed Oct 9 16:55:30 2013 -0700 + Merge pull request #49 from mateiz/kryo-fix-2 + [Fix Chill serialization of Range objects] + + 215238c Wed Oct 9 16:49:44 2013 -0700 + Merge pull request #50 from kayousterhout/SPARK-908 + [Fix race condition in SparkListenerSuite (fixes SPARK-908).] 
+ + 7827efc Wed Oct 9 15:07:25 2013 -0700 + Merge pull request #46 from mateiz/py-sort-update + [Fix PySpark docs and an overly long line of code after #38] + + 7b3ae04 Wed Oct 9 12:14:19 2013 -0700 + Merge pull request #45 from pwendell/metrics_units + [Use standard abbreviation in metrics description (MBytes -> MB)] + + b4fa11f Wed Oct 9 11:59:47 2013 -0700 + Merge pull request #38 from AndreSchumacher/pyspark_sorting + [SPARK-705: implement sortByKey() in PySpark] + + 19d445d Wed Oct 9 11:08:34 2013 -0700 + Merge pull request #22 from GraceH/metrics-naming + [SPARK-900 Use coarser grained naming for metrics] + + 7d50f9f Wed Oct 9 10:32:42 2013 -0700 + Merge pull request #35 from MartinWeindel/scala-2.10 + [Fixing inconsistencies and warnings on Scala 2.10 branch] + + 3218fa7 Tue Oct 8 23:44:55 2013 -0700 + Merge pull request #4 from MLnick/implicit-als + [Adding algorithm for implicit feedback data to ALS] + + e67d5b9 Tue Oct 8 22:57:38 2013 -0700 + Merge pull request #43 from mateiz/kryo-fix + [Don't allocate Kryo buffers unless needed] + + ea34c52 Mon Oct 7 20:45:58 2013 -0700 + Merge pull request #42 from pwendell/shuffle-read-perf + [Fix inconsistent and incorrect log messages in shuffle read path] + + 02f37ee Mon Oct 7 15:48:52 2013 -0700 + Merge pull request #39 from pwendell/master + [Adding Shark 0.7.1 to EC2 scripts] + + 213b70a Mon Oct 7 10:54:22 2013 -0700 + Merge pull request #31 from sundeepn/branch-0.8 + [Resolving package conflicts with hadoop 0.23.9] + + d585613 Sat Oct 5 22:57:05 2013 -0700 + Merge pull request #37 from pwendell/merge-0.8 + [merge in remaining changes from `branch-0.8`] + + 4a25b11 Sat Oct 5 19:28:55 2013 -0700 + Merge pull request #20 from harveyfeng/hadoop-config-cache + [Allow users to pass broadcasted Configurations and cache InputFormats across Hadoop file reads.] + + 8fc68d0 Sat Oct 5 17:24:35 2013 -0700 + Merge pull request #36 from pwendell/versions + [Bumping EC2 default version in master to .] 
+ + 100222b Sat Oct 5 13:38:59 2013 -0700 + Merge pull request #27 from davidmccauley/master + [SPARK-920/921 - JSON endpoint updates] + + 0864193 Sat Oct 5 13:25:18 2013 -0700 + Merge pull request #33 from AndreSchumacher/pyspark_partition_key_change + [Fixing SPARK-602: PythonPartitioner] + + 61ffcde Fri Oct 4 10:52:17 2013 -0700 + Merge pull request #15 from dcrankshaw/master + [Add synthetic generators] + + 3fe12cc Fri Oct 4 10:51:28 2013 -0700 + Merge pull request #946 from ScrapCodes/scala-2.10 + [Fixed non termination of Executor backend, when sc.stop is not called and system.exit instead.] + + 232765f Thu Oct 3 12:00:48 2013 -0700 + Merge pull request #26 from Du-Li/master + [fixed a wildcard bug in make-distribution.sh; ask sbt to check local] + + 405e69b Thu Oct 3 10:52:41 2013 -0700 + Merge pull request #25 from CruncherBigData/master + [Update README: updated the link] + + 49dbfcc Thu Oct 3 10:52:06 2013 -0700 + Merge pull request #28 from tgravescs/sparYarnAppName + [Allow users to set the application name for Spark on Yarn] + + e597ea3 Wed Oct 2 21:14:24 2013 -0700 + Merge pull request #10 from kayousterhout/results_through-bm + [Send Task results through the block manager when larger than Akka frame size (fixes SPARK-669).] + + 714fdab Thu Sep 26 14:28:55 2013 -0700 + Merge pull request #17 from rxin/optimize + [Remove -optimize flag] + + 13eced7 Thu Sep 26 14:18:19 2013 -0700 + Merge pull request #16 from pwendell/master + [Bug fix in master build] + + 70a0b99 Thu Sep 26 14:11:54 2013 -0700 + Merge pull request #14 from kayousterhout/untangle_scheduler + [Improved organization of scheduling packages.] 
+ + afd03b2 Thu Sep 26 14:09:55 2013 -0700 + Merge pull request #943 from ScrapCodes/scala-2.10 + [Scala 2.10 with akka 2.2] + + 76677b8 Thu Sep 26 14:03:46 2013 -0700 + Merge pull request #670 from jey/ec2-ssh-improvements + [EC2 SSH improvements] + + c514cd1 Thu Sep 26 13:48:20 2013 -0700 + Merge pull request #930 from holdenk/master + [Add mapPartitionsWithIndex] + + 560ee5c Thu Sep 26 11:27:34 2013 -0700 + Merge pull request #7 from wannabeast/memorystore-fixes + [some minor fixes to MemoryStore] + + 6566a19 Thu Sep 26 08:01:04 2013 -0700 + Merge pull request #9 from rxin/limit + [Smarter take/limit implementation.] + + 834686b Sun Sep 22 15:06:48 2013 -0700 + Merge pull request #928 from jerryshao/fairscheduler-refactor + [Refactor FairSchedulableBuilder] + + a2ea069 Sat Sep 21 23:04:42 2013 -0700 + Merge pull request #937 from jerryshao/localProperties-fix + [Fix PR926 local properties issues in Spark Streaming like scenarios] + + f06f2da Sat Sep 21 22:43:34 2013 -0700 + Merge pull request #941 from ilikerps/master + [Add "org.apache." 
prefix to packages in spark-class] + + 7bb12a2 Sat Sep 21 22:42:46 2013 -0700 + Merge pull request #940 from ankurdave/clear-port-properties-after-tests + [After unit tests, clear port properties unconditionally] + + a00317b Fri Sep 20 11:29:31 2013 -0700 + Merge pull request #1 from ankurdave/aggregateNeighbors-returns-graph + [Return Graph from Graph.aggregateNeighbors] + + 6a5e665 Thu Sep 19 22:41:44 2013 -0700 + Merge pull request #3 from ankurdave/clear-port-properties-after-tests + [After unit tests, clear port properties unconditionally ] + + 68ad33a Thu Sep 19 21:30:27 2013 -0700 + Merge pull request #2 from ankurdave/package-fixes + [Package fixes (spark.graph -> org.apache.spark.graph)] + + cd7222c Thu Sep 19 14:21:24 2013 -0700 + Merge pull request #938 from ilikerps/master + [Fix issue with spark_ec2 seeing empty security groups] + + e0dd24d Sat Aug 31 17:54:15 2013 -0700 + Merge pull request #879 from AndreSchumacher/scala-2.10 + [PySpark: replacing class manifest by class tag for Scala 2.10.2 in rdd.py] + + ad61349 Thu Jul 18 13:53:48 2013 -0700 + Merge pull request #709 from ScrapCodes/scala-2.10 + [Fixed warnings in scala 2.10 branch.] 
+ + a289ded Mon Jul 15 15:59:43 2013 -0700 + Merge pull request #700 from ScrapCodes/scala-2.10 + [Scala 2.10 ] + + 1044a95 Fri Jun 14 20:04:24 2013 -0700 + Merge pull request #652 from ScrapCodes/scala-2.10 + [Fixed maven build without netty fix] + + 4b57f83 Sat Apr 20 10:40:07 2013 -0700 + Merge pull request #535 from ScrapCodes/scala-2.10-repl-port + [porting of repl to scala-2.10] + + 73b3fee Sun Jan 20 10:11:49 2013 -0800 + Merge pull request #388 from folone/master + [Updated maven build configuration for Scala 2.10] + + 20adf27 Tue Jan 15 11:03:49 2013 -0800 + Merge pull request #371 from folone/master + [Scala 2.10.0] + +Release 0.8.0-incubating + + 2aff798 Sun Sep 15 14:05:04 2013 -0700 + Merge pull request #933 from jey/yarn-typo-fix + [Fix typo in Maven build docs] + + dbd2c4f Sun Sep 15 13:20:41 2013 -0700 + Merge pull request #932 from pwendell/mesos-version + [Bumping Mesos version to 0.13.0] + + 9fb0b9d Sun Sep 15 13:02:53 2013 -0700 + Merge pull request #931 from pwendell/yarn-docs + [Explain yarn.version in Maven build docs] + + c4c1db2 Fri Sep 13 19:52:12 2013 -0700 + Merge pull request #929 from pwendell/master + [Use different Hadoop version for YARN artifacts.] + + a310de6 Wed Sep 11 19:36:11 2013 -0700 + Merge pull request #926 from kayousterhout/dynamic + [Changed localProperties to use ThreadLocal (not DynamicVariable).] + + 58c7d8b Wed Sep 11 17:33:42 2013 -0700 + Merge pull request #927 from benh/mesos-docs + [Updated Spark on Mesos documentation.] + + 91a59e6 Wed Sep 11 10:21:48 2013 -0700 + Merge pull request #919 from mateiz/jets3t + [Add explicit jets3t dependency, which is excluded in hadoop-client] + + b9128d3 Wed Sep 11 10:03:06 2013 -0700 + Merge pull request #922 from pwendell/port-change + [Change default port number from 3030 to 4030.] 
+ + e07eef8 Wed Sep 11 07:35:39 2013 -0700 + Merge pull request #925 from davidmccauley/master + [SPARK-894 - Not all WebUI fields delivered VIA JSON] + + 8432f27 Tue Sep 10 23:19:53 2013 -0700 + Merge pull request #923 from haoyuan/master + [fix run-example script] + + d40f140 Tue Sep 10 23:05:29 2013 -0700 + Merge pull request #921 from pwendell/master + [Fix HDFS access bug with assembly build.] + + 0a6c051 Mon Sep 9 23:37:57 2013 -0700 + Merge pull request #918 from pwendell/branch-0.8 + [Update versions for 0.8.0 release.] + + 8c14f4b Mon Sep 9 22:07:58 2013 -0700 + Merge pull request #917 from pwendell/master + [Document libgfortran dependency for MLBase] + + c81377b Mon Sep 9 20:16:19 2013 -0700 + Merge pull request #915 from ooyala/master + [Get rid of / improve ugly NPE when Utils.deleteRecursively() fails] + + 61d2a01 Mon Sep 9 18:21:01 2013 -0700 + Merge pull request #916 from mateiz/mkdist-fix + [Fix copy issue in https://github.com/mesos/spark/pull/899] + + a85758c Mon Sep 9 13:45:40 2013 -0700 + Merge pull request #907 from stephenh/document_coalesce_shuffle + [Add better docs for coalesce.] 
+ + 084fc36 Mon Sep 9 12:01:35 2013 -0700 + Merge pull request #912 from tgravescs/ganglia-pom + [Add metrics-ganglia to core pom file] + + 0456384 Mon Sep 9 09:57:54 2013 -0700 + Merge pull request #911 from pwendell/ganglia-sink + [Adding Manen dependency for Ganglia] + + bf984e2 Sun Sep 8 23:50:24 2013 -0700 + Merge pull request #890 from mridulm/master + [Fix hash bug] + + e9d4f44 Sun Sep 8 23:36:48 2013 -0700 + Merge pull request #909 from mateiz/exec-id-fix + [Fix an instance where full standalone mode executor IDs were passed to] + + 2447b1c Sun Sep 8 22:27:49 2013 -0700 + Merge pull request #910 from mateiz/ml-doc-tweaks + [Small tweaks to MLlib docs] + + 7d3204b Sun Sep 8 21:39:12 2013 -0700 + Merge pull request #905 from mateiz/docs2 + [Job scheduling and cluster mode docs] + + f1f8371 Sun Sep 8 21:26:11 2013 -0700 + Merge pull request #896 from atalwalkar/master + [updated content] + + f68848d Sun Sep 8 18:32:16 2013 -0700 + Merge pull request #906 from pwendell/ganglia-sink + [Clean-up of Metrics Code/Docs and Add Ganglia Sink] + + 0b95799 Sun Sep 8 15:30:16 2013 -0700 + Merge pull request #908 from pwendell/master + [Fix target JVM version in scala build] + + 04cfb3a Sun Sep 8 10:33:20 2013 -0700 + Merge pull request #898 from ilikerps/660 + [SPARK-660: Add StorageLevel support in Python] + + 38488ac Sun Sep 8 00:28:53 2013 -0700 + Merge pull request #900 from pwendell/cdh-docs + [Provide docs to describe running on CDH/HDP cluster.] + + a8e376e Sat Sep 7 21:16:01 2013 -0700 + Merge pull request #904 from pwendell/master + [Adding Apache license to two files] + + cfde85e Sat Sep 7 13:53:08 2013 -0700 + Merge pull request #901 from ooyala/2013-09/0.8-doc-changes + [0.8 Doc changes for make-distribution.sh] + + 4a7813a Sat Sep 7 13:52:24 2013 -0700 + Merge pull request #903 from rxin/resulttask + [Fixed the bug that ResultTask was not properly deserializing outputId.] 
+ + afe46ba Sat Sep 7 07:28:51 2013 -0700 + Merge pull request #892 from jey/fix-yarn-assembly + [YARN build fixes] + + 2eebeff Fri Sep 6 15:25:22 2013 -0700 + Merge pull request #897 from pwendell/master + [Docs describing Spark monitoring and instrumentation] + + ddcb9d3 Thu Sep 5 23:54:09 2013 -0700 + Merge pull request #895 from ilikerps/821 + [SPARK-821: Don't cache results when action run locally on driver] + + 699c331 Thu Sep 5 20:21:53 2013 -0700 + Merge pull request #891 from xiajunluan/SPARK-864 + [[SPARK-864]DAGScheduler Exception if we delete Worker and StandaloneExecutorBackend then add Worker] + + 5c7494d Wed Sep 4 22:47:03 2013 -0700 + Merge pull request #893 from ilikerps/master + [SPARK-884: Add unit test to validate Spark JSON output] + + a547866 Wed Sep 4 21:11:56 2013 -0700 + Merge pull request #894 from c0s/master + [Updating assembly README to reflect recent changes in the build.] + + 19f7027 Tue Sep 3 14:29:10 2013 -0700 + Merge pull request #878 from tgravescs/yarnUILink + [Link the Spark UI up to the Yarn UI ] + + 68df246 Tue Sep 3 13:01:17 2013 -0700 + Merge pull request #889 from alig/master + [Return the port the WebUI is bound to (useful if port 0 was used)] + + d3dd48f Mon Sep 2 16:44:54 2013 -0700 + Merge pull request #887 from mateiz/misc-fixes + [Miscellaneous fixes for 0.8] + + 636fc0c Mon Sep 2 11:20:39 2013 -0700 + Merge pull request #886 from mateiz/codec + [Fix spark.io.compression.codec and change default codec to LZF] + + d9a53b9 Sun Sep 1 22:12:30 2013 -0700 + Merge pull request #885 from mateiz/win-py + [Allow PySpark to run on Windows] + + 3c520fe Sun Sep 1 17:26:55 2013 -0700 + Merge pull request #884 from mateiz/win-fixes + [Run script fixes for Windows after package & assembly change] + + f957c26 Sun Sep 1 14:53:57 2013 -0700 + Merge pull request #882 from mateiz/package-rename + [Rename spark package to org.apache.spark] + + a30fac1 Sun Sep 1 12:27:50 2013 -0700 + Merge pull request #883 from alig/master + [Don't 
require the spark home environment variable to be set for standalone mode (change needed by SIMR)] + + 03cc765 Sun Sep 1 10:20:56 2013 -0700 + Merge pull request #881 from pwendell/master + [Extend QuickStart to include next steps] + + 0e9565a Sat Aug 31 18:55:41 2013 -0700 + Merge pull request #880 from mateiz/ui-tweaks + [Various UI tweaks] + + 2b29a1d Sat Aug 31 17:49:45 2013 -0700 + Merge pull request #877 from mateiz/docs + [Doc improvements for 0.8] + + 6edef9c Sat Aug 31 13:39:24 2013 -0700 + Merge pull request #861 from AndreSchumacher/pyspark_sampling_function + [Pyspark sampling function] + + fd89835 Sat Aug 31 13:18:12 2013 -0700 + Merge pull request #870 from JoshRosen/spark-885 + [Don't send SIGINT / ctrl-c to Py4J gateway subprocess] + + 618f0ec Fri Aug 30 18:17:13 2013 -0700 + Merge pull request #869 from AndreSchumacher/subtract + [PySpark: implementing subtractByKey(), subtract() and keyBy()] + + 94bb7fd Fri Aug 30 12:05:13 2013 -0700 + Merge pull request #876 from mbautin/master_hadoop_rdd_conf + [Make HadoopRDD's configuration accessible] + + 9e17e45 Fri Aug 30 00:22:53 2013 -0700 + Merge pull request #875 from shivaram/build-fix + [Fix broken build by removing addIntercept] + + 016787d Thu Aug 29 22:15:14 2013 -0700 + Merge pull request #863 from shivaram/etrain-ridge + [Adding linear regression and refactoring Ridge regression to use SGD] + + 852d810 Thu Aug 29 22:13:15 2013 -0700 + Merge pull request #819 from shivaram/sgd-cleanup + [Change SVM to use {0,1} labels] + + ca71620 Thu Aug 29 21:51:14 2013 -0700 + Merge pull request #857 from mateiz/assembly + [Change build and run instructions to use assemblies] + + 1528776 Thu Aug 29 21:30:47 2013 -0700 + Merge pull request #874 from jerryshao/fix-report-bug + [Fix removed block zero size log reporting] + + abdbacf Wed Aug 28 21:11:31 2013 -0700 + Merge pull request #871 from pwendell/expose-local + [Expose `isLocal` in SparkContext.] 
+ + afcade3 Wed Aug 28 20:15:40 2013 -0700 + Merge pull request #873 from pwendell/master + [Hot fix for command runner] + + baa84e7 Wed Aug 28 12:44:46 2013 -0700 + Merge pull request #865 from tgravescs/fixtmpdir + [Spark on Yarn should use yarn approved directories for spark.local.dir and tmp] + + cd043cf Tue Aug 27 19:50:32 2013 -0700 + Merge pull request #867 from tgravescs/yarnenvconfigs + [Spark on Yarn allow users to specify environment variables ] + + 898da7e Mon Aug 26 20:40:49 2013 -0700 + Merge pull request #859 from ianbuss/sbt_opts + [Pass SBT_OPTS environment through to sbt_launcher] + + 17bafea Mon Aug 26 11:59:32 2013 -0700 + Merge pull request #864 from rxin/json1 + [Revert json library change] + + f9fc5c1 Sat Aug 24 15:19:56 2013 -0700 + Merge pull request #603 from pwendell/ec2-updates + [Several Improvements to EC2 Scripts] + + d282c1e Fri Aug 23 11:20:20 2013 -0700 + Merge pull request #860 from jey/sbt-ide-fixes + [Fix IDE project generation under SBT] + + 5a6ac12 Thu Aug 22 22:08:03 2013 -0700 + Merge pull request #701 from ScrapCodes/documentation-suggestions + [Documentation suggestions for spark streaming.] + + 46ea0c1 Thu Aug 22 15:57:28 2013 -0700 + Merge pull request #814 from holdenk/master + [Create less instances of the random class during ALS initialization.] + + 9ac3d62 Thu Aug 22 15:51:10 2013 -0700 + Merge pull request #856 from jey/sbt-fix-hadoop-0.23.9 + [Re-add removed dependency to fix build under Hadoop 0.23.9] + + ae8ba83 Thu Aug 22 10:14:54 2013 -0700 + Merge pull request #855 from jey/update-build-docs + [Update build docs] + + 8a36fd0 Thu Aug 22 10:13:35 2013 -0700 + Merge pull request #854 from markhamstra/pomUpdate + [Synced sbt and maven builds to use the same dependencies, etc.] 
+ + c2d00f1 Thu Aug 22 10:13:03 2013 -0700 + Merge pull request #832 from alig/coalesce + [Coalesced RDD with locality] + + e6d66c8 Wed Aug 21 17:44:31 2013 -0700 + Merge pull request #853 from AndreSchumacher/double_rdd + [Implementing SPARK-838: Add DoubleRDDFunctions methods to PySpark] + + 2905611 Tue Aug 20 17:36:14 2013 -0700 + Merge pull request #851 from markhamstra/MutablePairTE + [Removed meaningless types] + + d61337f Tue Aug 20 10:06:06 2013 -0700 + Merge pull request #844 from markhamstra/priorityRename + [Renamed 'priority' to 'jobId' and assorted minor changes] + + 8cae72e Mon Aug 19 23:40:04 2013 -0700 + Merge pull request #828 from mateiz/sched-improvements + [Scheduler fixes and improvements] + + efeb142 Mon Aug 19 19:23:50 2013 -0700 + Merge pull request #849 from mateiz/web-fixes + [Small fixes to web UI] + + abdc1f8 Mon Aug 19 18:30:56 2013 -0700 + Merge pull request #847 from rxin/rdd + [Allow subclasses of Product2 in all key-value related classes] + + 8fa0747 Sun Aug 18 17:02:54 2013 -0700 + Merge pull request #840 from AndreSchumacher/zipegg + [Implementing SPARK-878 for PySpark: adding zip and egg files to context ...] + + 1e137a5 Sat Aug 17 22:22:32 2013 -0700 + Merge pull request #846 from rxin/rdd + [Two minor RDD refactoring] + + e89ffc7 Fri Aug 16 14:02:34 2013 -0700 + Merge pull request #839 from jegonzal/zip_partitions + [Currying RDD.zipPartitions ] + + 1fb1b09 Thu Aug 15 22:15:05 2013 -0700 + Merge pull request #841 from rxin/json + [Use the JSON formatter from Scala library and removed dependency on lift-json.] 
+ + c69c489 Thu Aug 15 20:55:09 2013 -0700 + Merge pull request #843 from Reinvigorate/bug-879 + [fixing typo in conf/slaves] + + 230ab27 Thu Aug 15 17:45:17 2013 -0700 + Merge pull request #834 from Daemoen/master + [Updated json output to allow for display of worker state] + + 659553b Thu Aug 15 16:56:31 2013 -0700 + Merge pull request #836 from pwendell/rename + [Rename `memoryBytesToString` and `memoryMegabytesToString`] + + 28369ff Thu Aug 15 16:44:02 2013 -0700 + Merge pull request #829 from JoshRosen/pyspark-unit-tests-python-2.6 + [Fix PySpark unit tests on Python 2.6] + + 1a13460 Thu Aug 15 15:50:44 2013 -0700 + Merge pull request #833 from rxin/ui + [Various UI improvements.] + + 044a088 Wed Aug 14 20:43:49 2013 -0700 + Merge pull request #831 from rxin/scheduler + [A few small scheduler / job description changes.] + + 839f2d4 Wed Aug 14 16:17:23 2013 -0700 + Merge pull request #822 from pwendell/ui-features + [Adding GC Stats to TaskMetrics (and three small fixes)] + + 63446f9 Wed Aug 14 00:17:07 2013 -0700 + Merge pull request #826 from kayousterhout/ui_fix + [Fixed 2 bugs in executor UI (incl. SPARK-877)] + + 3f14cba Tue Aug 13 20:09:51 2013 -0700 + Merge pull request #825 from shivaram/maven-repl-fix + [Set SPARK_CLASSPATH for maven repl tests] + + 596adc6 Tue Aug 13 19:41:34 2013 -0700 + Merge pull request #824 from mateiz/mesos-0.12.1 + [Update to Mesos 0.12.1] + + d316af9 Tue Aug 13 15:31:01 2013 -0700 + Merge pull request #821 from pwendell/print-launch-command + [Print run command to stderr rather than stdout] + + 1f79d21 Tue Aug 13 15:23:54 2013 -0700 + Merge pull request #818 from kayousterhout/killed_fix + [Properly account for killed tasks.] 
+ + 622f83c Tue Aug 13 09:58:52 2013 -0700 + Merge pull request #817 from pwendell/pr_784 + [Minor clean-up in metrics servlet code] + + a0133bf Tue Aug 13 09:28:18 2013 -0700 + Merge pull request #784 from jerryshao/dev-metrics-servlet + [Add MetricsServlet for Spark metrics system] + + e2fdac6 Mon Aug 12 21:26:59 2013 -0700 + Merge pull request #802 from stayhf/SPARK-760-Python + [Simple PageRank algorithm implementation in Python for SPARK-760] + + d3525ba Mon Aug 12 21:02:39 2013 -0700 + Merge pull request #813 from AndreSchumacher/add_files_pyspark + [Implementing SPARK-865: Add the equivalent of ADD_JARS to PySpark] + + 9e02da2 Mon Aug 12 20:22:27 2013 -0700 + Merge pull request #812 from shivaram/maven-mllib-tests + [Create SparkContext in beforeAll for MLLib tests] + + 65d0d91 Mon Aug 12 19:00:57 2013 -0700 + Merge pull request #807 from JoshRosen/guava-optional + [Change scala.Option to Guava Optional in Java APIs] + + 4346f0a Mon Aug 12 12:12:12 2013 -0700 + Merge pull request #809 from shivaram/sgd-cleanup + [Clean up scaladoc in ML Lib.] + + ea1b4ba Mon Aug 12 08:09:58 2013 -0700 + Merge pull request #806 from apivovarov/yarn-205 + [Changed yarn.version to 2.0.5 in pom.xml] + + 2a39d2c Sun Aug 11 20:35:09 2013 -0700 + Merge pull request #810 from pwendell/dead_doc_code + [Remove now dead code inside of docs] + + e5b9ed2 Sun Aug 11 17:22:47 2013 -0700 + Merge pull request #808 from pwendell/ui_compressed_bytes + [Report compressed bytes read when calculating TaskMetrics] + + 3796486 Sun Aug 11 14:51:47 2013 -0700 + Merge pull request #805 from woggle/hadoop-rdd-jobconf + [Use new Configuration() instead of slower new JobConf() in SerializableWritable] + + ff9ebfa Sun Aug 11 10:52:55 2013 -0700 + Merge pull request #762 from shivaram/sgd-cleanup + [Refactor SGD options into a new class.] 
+ + 95c62ca Sun Aug 11 10:30:52 2013 -0700 + Merge pull request #804 from apivovarov/master + [Fixed path to JavaALS.java and JavaKMeans.java, fixed hadoop2-yarn profi...] + + 06e4f2a Sat Aug 10 18:06:23 2013 -0700 + Merge pull request #789 from MLnick/master + [Adding Scala version of PageRank example] + + 71c63de Sat Aug 10 10:21:20 2013 -0700 + Merge pull request #795 from mridulm/master + [Fix bug reported in PR 791 : a race condition in ConnectionManager and Connection] + + d17eeb9 Sat Aug 10 09:02:27 2013 -0700 + Merge pull request #785 from anfeng/master + [expose HDFS file system stats via Executor metrics] + + dce5e47 Fri Aug 9 21:53:45 2013 -0700 + Merge pull request #800 from dlyubimov/HBASE_VERSION + [Pull HBASE_VERSION in the head of sbt build] + + cd247ba Fri Aug 9 20:41:13 2013 -0700 + Merge pull request #786 from shivaram/mllib-java + [Java fixes, tests and examples for ALS, KMeans] + + b09d4b7 Fri Aug 9 13:17:08 2013 -0700 + Merge pull request #799 from woggle/sync-fix + [Remove extra synchronization in ResultTask] + + 0bc63bf Fri Aug 9 13:16:25 2013 -0700 + Merge pull request #801 from pwendell/print-launch-command + [Print launch command [Branch 0.8 version]] + + cc6b92e Fri Aug 9 13:00:33 2013 -0700 + Merge pull request #775 from pwendell/print-launch-command + [Log the launch command for Spark daemons] + + f94fc75 Fri Aug 9 10:04:03 2013 -0700 + Merge pull request #788 from shane-huang/sparkjavaopts + [For standalone mode, add worker local env setting of SPARK_JAVA_OPTS as ...] 
+ + 63b6e02 Thu Aug 8 14:02:02 2013 -0700 + Merge pull request #797 from mateiz/chill-0.3.1 + [Update to Chill 0.3.1] + + 9955e5a Thu Aug 8 11:03:38 2013 -0700 + Merge pull request #796 from pwendell/bootstrap-design + [Bootstrap re-design] + + 5133e4b Wed Aug 7 15:50:45 2013 -0700 + Merge pull request #790 from kayousterhout/fix_throughput + [Fixed issue in UI that decreased scheduler throughput by 5x or more] + + 3c8478e Tue Aug 6 23:25:03 2013 -0700 + Merge pull request #747 from mateiz/improved-lr + [Update the Python logistic regression example] + + 6b043a6 Tue Aug 6 22:31:02 2013 -0700 + Merge pull request #724 from dlyubimov/SPARK-826 + [SPARK-826: fold(), reduce(), collect() always attempt to use java serialization] + + de6c4c9 Tue Aug 6 17:09:50 2013 -0700 + Merge pull request #787 from ash211/master + [Update spark-standalone.md] + + df4d10d Tue Aug 6 15:44:05 2013 -0700 + Merge pull request #779 from adatao/adatao-global-SparkEnv + [[HOTFIX] Extend thread safety for SparkEnv.get()] + + d2b0f0c Tue Aug 6 14:49:39 2013 -0700 + Merge pull request #770 from stayhf/SPARK-760-Java + [Simple PageRank algorithm implementation in Java for SPARK-760] + + d031f73 Mon Aug 5 22:33:00 2013 -0700 + Merge pull request #782 from WANdisco/master + [SHARK-94 Log the files computed by HadoopRDD and NewHadoopRDD] + + 1b63dea Mon Aug 5 22:21:26 2013 -0700 + Merge pull request #769 from markhamstra/NegativeCores + [SPARK-847 + SPARK-845: Zombie workers and negative cores] + + 828aff7 Mon Aug 5 21:37:33 2013 -0700 + Merge pull request #776 from gingsmith/master + [adding matrix factorization data generator] + + 8b27789 Mon Aug 5 19:14:52 2013 -0700 + Merge pull request #774 from pwendell/job-description + [Show user-defined job name in UI] + + 550b0cf Mon Aug 5 12:10:32 2013 -0700 + Merge pull request #780 from cybermaster/master + [SPARK-850] + + 22abbc1 Fri Aug 2 16:37:59 2013 -0700 + Merge pull request #772 from karenfeng/ui-843 + [Show app duration] + + 9d7dfd2 Thu Aug 1 
17:41:58 2013 -0700 + Merge pull request #743 from pwendell/app-metrics + [Add application metrics to standalone master] + + 6d7afd7 Thu Aug 1 17:13:28 2013 -0700 + Merge pull request #768 from pwendell/pr-695 + [Minor clean-up of fair scheduler UI] + + 5e7b38f Thu Aug 1 14:59:33 2013 -0700 + Merge pull request #695 from xiajunluan/pool_ui + [Enhance job ui in spark ui system with adding pool information] + + 0a96493 Thu Aug 1 11:27:17 2013 -0700 + Merge pull request #760 from karenfeng/heading-update + [Clean up web UI page headers] + + cb7dd86 Thu Aug 1 11:06:10 2013 -0700 + Merge pull request #758 from pwendell/master-json + [Add JSON path to master index page] + + 58756b7 Wed Jul 31 23:45:41 2013 -0700 + Merge pull request #761 from mateiz/kmeans-generator + [Add data generator for K-means] + + ecab635 Wed Jul 31 18:16:55 2013 -0700 + Merge pull request #763 from c0s/assembly + [SPARK-842. Maven assembly is including examples libs and dependencies] + + 39c75f3 Wed Jul 31 15:52:36 2013 -0700 + Merge pull request #757 from BlackNiuza/result_task_generation + [Bug fix: SPARK-837] + + b2b86c2 Wed Jul 31 15:51:39 2013 -0700 + Merge pull request #753 from shivaram/glm-refactor + [Build changes for ML lib] + + 14bf2fe Wed Jul 31 14:18:16 2013 -0700 + Merge pull request #749 from benh/spark-executor-uri + [Added property 'spark.executor.uri' for launching on Mesos.] 
+ + 4ba4c3f Wed Jul 31 13:14:49 2013 -0700 + Merge pull request #759 from mateiz/split-fix + [Use the Char version of split() instead of the String one in MLUtils] + + a386ced Wed Jul 31 11:22:50 2013 -0700 + Merge pull request #754 from rxin/compression + [Compression codec change] + + 0be071a Wed Jul 31 11:11:59 2013 -0700 + Merge pull request #756 from cdshines/patch-1 + [Refactored Vector.apply(length, initializer) replacing excessive code with library method] + + d4556f4 Wed Jul 31 08:48:14 2013 -0700 + Merge pull request #751 from cdshines/master + [Cleaned Partitioner & PythonPartitioner source by taking out non-related logic to Utils] + + 29b8cd3 Tue Jul 30 21:30:33 2013 -0700 + Merge pull request #755 from jerryshao/add-apache-header + [Add Apache license header to metrics system] + + e87de03 Tue Jul 30 15:00:08 2013 -0700 + Merge pull request #744 from karenfeng/bootstrap-update + [Use Bootstrap progress bars in web UI] + + ae57020 Tue Jul 30 14:56:41 2013 -0700 + Merge pull request #752 from rxin/master + [Minor mllib cleanup] + + 8aee118 Tue Jul 30 10:27:54 2013 -0700 + Merge pull request #748 from atalwalkar/master + [made SimpleUpdater consistent with other updaters] + + 468a36c Mon Jul 29 19:44:33 2013 -0700 + Merge pull request #746 from rxin/cleanup + [Internal cleanup] + + 1e1ffb1 Mon Jul 29 19:26:19 2013 -0700 + Merge pull request #745 from shivaram/loss-update-fix + [Remove duplicate loss history in Gradient Descent] + + c99b674 Mon Jul 29 16:32:55 2013 -0700 + Merge pull request #735 from karenfeng/ui-807 + [Totals for shuffle data and CPU time] + + fe7298b Mon Jul 29 14:01:00 2013 -0700 + Merge pull request #741 from pwendell/usability + [Fix two small usability issues] + + c34c0f6 Mon Jul 29 13:18:10 2013 -0700 + Merge pull request #731 from pxinghao/master + [Adding SVM and Lasso] + + f3d72ff Fri Jul 26 17:19:27 2013 -0700 + Merge pull request #739 from markhamstra/toolsPom + [Missing tools/pom.xml scalatest dependency] + + cb36677 Fri Jul 
26 16:59:30 2013 -0700 + Merge pull request #738 from harsha2010/pruning + [Fix bug in Partition Pruning.] + + f3cf094 Thu Jul 25 14:53:21 2013 -0700 + Merge pull request #734 from woggle/executor-env2 + [Get more env vars from driver rather than worker] + + 51c2427 Thu Jul 25 00:03:11 2013 -0700 + Merge pull request #732 from ryanlecompte/master + [Refactor Kryo serializer support to use chill/chill-java] + + 52723b9 Wed Jul 24 14:33:02 2013 -0700 + Merge pull request #728 from jey/examples-jar-env + [Fix setting of SPARK_EXAMPLES_JAR] + + 20338c2 Wed Jul 24 14:32:24 2013 -0700 + Merge pull request #729 from karenfeng/ui-811 + [Stage Page updates] + + 5584ebc Wed Jul 24 11:46:46 2013 -0700 + Merge pull request #675 from c0s/assembly + [Building spark assembly for further consumption of the Spark project with a deployed cluster] + + a73f3ee Wed Jul 24 08:59:14 2013 -0700 + Merge pull request #671 from jerryshao/master + [Add metrics system for Spark] + + b011329 Tue Jul 23 22:50:09 2013 -0700 + Merge pull request #727 from rxin/scheduler + [Scheduler code style cleanup.] + + 876125b Tue Jul 23 22:28:21 2013 -0700 + Merge pull request #726 from rxin/spark-826 + [SPARK-829: scheduler shouldn't hang if a task contains unserializable objects in its closure] + + 2f1736c Tue Jul 23 15:53:30 2013 -0700 + Merge pull request #725 from karenfeng/task-start + [Creates task start events] + + 5364f64 Tue Jul 23 13:40:34 2013 -0700 + Merge pull request #723 from rxin/mllib + [Made RegressionModel serializable and added unit tests to make sure predict methods would work.] 
+ + f369e0e Tue Jul 23 13:22:27 2013 -0700 + Merge pull request #720 from ooyala/2013-07/persistent-rdds-api + [Add a public method getCachedRdds to SparkContext] + + 401aac8 Mon Jul 22 16:57:16 2013 -0700 + Merge pull request #719 from karenfeng/ui-808 + [Creates Executors tab for Jobs UI] + + 8ae1436 Mon Jul 22 16:03:04 2013 -0700 + Merge pull request #722 from JoshRosen/spark-825 + [Fix bug: DoubleRDDFunctions.sampleStdev() computed non-sample stdev()] + + 15fb394 Sun Jul 21 10:33:38 2013 -0700 + Merge pull request #716 from c0s/webui-port + [Regression: default webui-port can't be set via command line "--webui-port" anymore] + + c40f0f2 Fri Jul 19 13:33:04 2013 -0700 + Merge pull request #711 from shivaram/ml-generators + [Move ML lib data generator files to util/] + + 413b841 Fri Jul 19 13:31:38 2013 -0700 + Merge pull request #717 from viirya/dev1 + [Do not copy local jars given to SparkContext in yarn mode] + + 0d0a47c Thu Jul 18 12:06:37 2013 -0700 + Merge pull request #710 from shivaram/ml-updates + [Updates to LogisticRegression] + + c6235b5 Thu Jul 18 11:43:48 2013 -0700 + Merge pull request #714 from adatao/master + [[BUGFIX] Fix for sbt/sbt script SPARK_HOME setting] + + 009c79e Thu Jul 18 11:41:52 2013 -0700 + Merge pull request #715 from viirya/dev1 + [fix a bug in build process that pulls in two versions of ASM.] + + 985a9e3 Wed Jul 17 22:27:19 2013 -0700 + Merge pull request #712 from stayhf/SPARK-817 + [Consistently invoke bash with /usr/bin/env bash in scripts to make code ...] + + cad48ed Tue Jul 16 21:41:28 2013 -0700 + Merge pull request #708 from ScrapCodes/dependencies-upgrade + [Dependency upgrade Akka 2.0.3 -> 2.0.5] + + 8a8a8f2 Mon Jul 15 23:09:21 2013 -0700 + Merge pull request #705 from rxin/errormessages + [Throw a more meaningful message when runJob is called to launch tasks on non-existent partitions.] 
+ + ed8415b Mon Jul 15 16:41:04 2013 -0700 + Merge pull request #703 from karenfeng/ui-802 + [Link to job UI from standalone deploy cluster web UI] + + e3d3e6f Mon Jul 15 14:59:44 2013 -0700 + Merge pull request #702 from karenfeng/ui-fixes + [Adds app name in HTML page titles on job web UI] + + c7877d5 Sun Jul 14 12:58:13 2013 -0700 + Merge pull request #689 from BlackNiuza/application_status + [Bug fix: SPARK-796] + + 10c0593 Sun Jul 14 11:45:18 2013 -0700 + Merge pull request #699 from pwendell/ui-env + [Add `Environment` tab to SparkUI.] + + 89e8549 Sat Jul 13 16:11:08 2013 -0700 + Merge pull request #698 from Reinvigorate/sm-deps-change + [changing com.google.code.findbugs maven coordinates] + + 77c69ae Fri Jul 12 23:05:21 2013 -0700 + Merge pull request #697 from pwendell/block-locations + [Show block locations in Web UI.] + + 5a7835c Fri Jul 12 20:28:21 2013 -0700 + Merge pull request #691 from karenfeng/logpaging + [Create log pages] + + 71ccca0 Fri Jul 12 20:25:06 2013 -0700 + Merge pull request #696 from woggle/executor-env + [Pass executor env vars (e.g. SPARK_CLASSPATH) to compute-classpath.sh] + + 90fc3f3 Fri Jul 12 20:23:36 2013 -0700 + Merge pull request #692 from Reinvigorate/takeOrdered + [adding takeOrdered() to RDD] + + 018d04c Thu Jul 11 12:48:37 2013 -0700 + Merge pull request #684 from woggle/mesos-classloader + [Explicitly set class loader for MesosSchedulerDriver callbacks.] 
+ + bc19477 Wed Jul 10 22:29:41 2013 -0700 + Merge pull request #693 from c0s/readme + [Updating README to reflect Scala 2.9.3 requirements] + + 7dcda9a Mon Jul 8 23:24:23 2013 -0700 + Merge pull request #688 from markhamstra/scalaDependencies + [Fixed SPARK-795 with explicit dependencies] + + 638927b Mon Jul 8 22:58:50 2013 -0700 + Merge pull request #683 from shivaram/sbt-test-fix + [Remove some stack traces from sbt test output] + + 3c13178 Mon Jul 8 14:50:34 2013 -0700 + Merge pull request #687 from atalwalkar/master + [Added "Labeled" to util functions for labeled data] + + 744da8e Sun Jul 7 17:42:25 2013 -0700 + Merge pull request #679 from ryanlecompte/master + [Make binSearch method tail-recursive for RidgeRegression] + + 3cc6818 Sat Jul 6 19:51:20 2013 -0700 + Merge pull request #668 from shimingfei/guava-14.0.1 + [update guava version from 11.0.1 to 14.0.1] + + 2216188 Sat Jul 6 16:18:15 2013 -0700 + Merge pull request #676 from c0s/asf-avro + [Use standard ASF published avro module instead of a proprietory built one] + + 94871e4 Sat Jul 6 15:26:19 2013 -0700 + Merge pull request #655 from tgravescs/master + [Add support for running Spark on Yarn on a secure Hadoop Cluster] + + 3f918b3 Sat Jul 6 12:45:18 2013 -0700 + Merge pull request #672 from holdenk/master + [s/ActorSystemImpl/ExtendedActorSystem/ as ActorSystemImpl results in a warning] + + 2a36e54 Sat Jul 6 12:43:21 2013 -0700 + Merge pull request #673 from xiajunluan/master + [Add config template file for fair scheduler feature] + + 7ba7fa1 Sat Jul 6 11:45:08 2013 -0700 + Merge pull request #674 from liancheng/master + [Bug fix: SPARK-789] + + f4416a1 Sat Jul 6 11:41:58 2013 -0700 + Merge pull request #681 from BlackNiuza/memory_leak + [Remove active job from idToActiveJob when job finished or aborted] + + e063e29 Fri Jul 5 21:54:52 2013 -0700 + Merge pull request #680 from tdas/master + [Fixed major performance bug in Network Receiver] + + bf1311e Fri Jul 5 17:32:44 2013 -0700 + Merge pull request 
#678 from mateiz/ml-examples + [Start of ML package] + + 6ad85d0 Thu Jul 4 21:32:29 2013 -0700 + Merge pull request #677 from jerryshao/fix_stage_clean + [Clean StageToInfos periodically when spark.cleaner.ttl is enabled] + + 2e32fc8 Thu Jul 4 12:18:20 2013 -0700 + Merge pull request #666 from c0s/master + [hbase dependency is missed in hadoop2-yarn profile of examples module +] + + 6d60fe5 Mon Jul 1 18:24:03 2013 -0700 + Merge pull request #666 from c0s/master + [hbase dependency is missed in hadoop2-yarn profile of examples module] + + ccfe953 Sat Jun 29 17:57:53 2013 -0700 + Merge pull request #577 from skumargithub/master + [Example of cumulative counting using updateStateByKey] + + 50ca176 Thu Jun 27 22:24:52 2013 -0700 + Merge pull request #664 from pwendell/test-fix + [Removing incorrect test statement] + + e49bc8c Wed Jun 26 11:13:33 2013 -0700 + Merge pull request #663 from stephenh/option_and_getenv + [Be cute with Option and getenv.] + + f5e32ed Tue Jun 25 09:16:57 2013 -0700 + Merge pull request #661 from mesos/streaming + [Kafka fixes and DStream.count fix for master] + + 1249e91 Mon Jun 24 21:46:33 2013 -0700 + Merge pull request #572 from Reinvigorate/sm-block-interval + [Adding spark.streaming.blockInterval property] + + cfcda95 Mon Jun 24 21:44:50 2013 -0700 + Merge pull request #571 from Reinvigorate/sm-kafka-serializers + [Surfacing decoders on KafkaInputDStream] + + 575aff6 Mon Jun 24 21:35:50 2013 -0700 + Merge pull request #567 from Reinvigorate/sm-count-fix + [Fixing count() in Spark Streaming] + + 3e61bef Sat Jun 22 16:22:47 2013 -0700 + Merge pull request #648 from shivaram/netty-dbg + [Shuffle fixes and cleanup] + + 1ef5d0d Sat Jun 22 09:35:57 2013 -0700 + Merge pull request #644 from shimingfei/joblogger + [add Joblogger to Spark (on new Spark code)] + + 7e4b266 Sat Jun 22 07:53:18 2013 -0700 + Merge pull request #563 from jey/python-optimization + [Optimize PySpark worker invocation] + + 71030ba Wed Jun 19 15:21:03 2013 -0700 + Merge 
pull request #654 from lyogavin/enhance_pipe + [fix typo and coding style in #638] + + 73f4c7d Tue Jun 18 04:21:17 2013 -0700 + Merge pull request #605 from esjewett/SPARK-699 + [Add hBase example (retry of pull request #596)] + + 9933836 Tue Jun 18 02:41:10 2013 -0700 + Merge pull request #647 from jerryshao/master + [Reduce ZippedPartitionsRDD's getPreferredLocations complexity from O(2^2n) to O(2^n)] + + db42451 Mon Jun 17 15:26:36 2013 -0700 + Merge pull request #643 from adatao/master + [Bug fix: Zero-length partitions result in NaN for overall mean & variance] + + e82a2ff Mon Jun 17 15:13:15 2013 -0700 + Merge pull request #653 from rxin/logging + [SPARK-781: Log the temp directory path when Spark says "Failed to create temp directory."] + + e6d1277 Mon Jun 17 12:56:25 2013 -0700 + Merge pull request #638 from lyogavin/enhance_pipe + [Enhance pipe to support more features we can do in hadoop streaming] + + f961aac Sat Jun 15 00:53:41 2013 -0700 + Merge pull request #649 from ryanlecompte/master + [Add top K method to RDD using a bounded priority queue] + + 6602d94 Fri Jun 14 10:41:31 2013 -0700 + Merge pull request #651 from rxin/groupbykey + [SPARK-772 / SPARK-774: groupByKey and cogroup should disable map side combine] + + d93851a Thu Jun 13 13:38:45 2013 -0700 + Merge pull request #645 from pwendell/compression + [Adding compression to Hadoop save functions] + + f1da591 Wed Jun 12 17:55:08 2013 -0700 + Merge pull request #646 from markhamstra/jvmArgs + [Fixed jvmArgs in maven build.] + + 0e94b73 Mon Jun 10 13:00:31 2013 -0700 + Merge pull request #625 from stephenh/fix-start-slave + [Fix start-slave not passing instance number to spark-daemon.] + + 74b91d5 Sat Jun 8 01:19:40 2013 -0700 + Merge pull request #629 from c0s/master + [Sometime Maven build runs out of PermGen space.] 
+ + c8fc423 Fri Jun 7 22:43:18 2013 -0700 + Merge pull request #631 from jerryshao/master + [Fix block manager UI display issue when enable spark.cleaner.ttl] + + 1ae60bc Fri Jun 7 22:39:06 2013 -0700 + Merge pull request #634 from xiajunluan/master + [[Spark-753] Fix ClusterSchedulSuite unit test failed ] + + fff3728 Tue Jun 4 16:09:50 2013 -0700 + Merge pull request #640 from pwendell/timeout-update + [Fixing bug in BlockManager timeout] + + f420d4f Tue Jun 4 15:25:58 2013 -0700 + Merge pull request #639 from pwendell/timeout-update + [Bump akka and blockmanager timeouts to 60 seconds] + + 84530ba Fri May 31 17:06:13 2013 -0700 + Merge pull request #636 from rxin/unpersist + [Unpersist More block manager cleanup.] + + ef77bb7 Thu May 30 14:50:06 2013 -0700 + Merge pull request #627 from shivaram/master + [Netty and shuffle bug fixes] + + 8cb8178 Thu May 30 14:17:44 2013 -0700 + Merge pull request #628 from shivaram/zero-block-size + [Skip fetching zero-sized blocks in NIO.] + + 6ed7139 Wed May 29 10:14:22 2013 -0700 + Merge pull request #626 from stephenh/remove-add-if-no-port + [Remove unused addIfNoPort.] + + 41d230c Tue May 28 23:35:24 2013 -0700 + Merge pull request #611 from squito/classloader + [Use default classloaders for akka & deserializing task results] + + 3db1e17 Mon May 27 21:31:43 2013 -0700 + Merge pull request #620 from jerryshao/master + [Fix CheckpointRDD java.io.FileNotFoundException when calling getPreferredLocations] + + 3d4891d Sat May 25 23:38:05 2013 -0700 + Merge pull request #621 from JoshRosen/spark-613 + [Use ec2-metadata in start-slave.sh to detect if running on EC2] + + e8d4b6c Sat May 25 21:09:03 2013 -0700 + Merge pull request #529 from xiajunluan/master + [[SPARK-663]Implement Fair Scheduler in Spark Cluster Scheduler ] + + 9a3c344 Sat May 25 17:53:43 2013 -0700 + Merge pull request #624 from rxin/master + [NonJavaSerializableClass should not be Java serializable...] 
+ + 24e41aa Fri May 24 16:48:52 2013 -0700 + Merge pull request #623 from rxin/master + [Automatically configure Netty port.] + + 69161f9 Fri May 24 14:42:13 2013 -0700 + Merge pull request #622 from rxin/master + [bug fix: Shuffle block iterator is ignoring the shuffle serializer setting.] + + dbbedfc Thu May 23 23:11:06 2013 -0700 + Merge pull request #616 from jey/maven-netty-exclusion + [Exclude old versions of Netty from Maven-based build] + + a2b0a79 Tue May 21 18:16:20 2013 -0700 + Merge pull request #619 from woggling/adjust-sampling + [Use ARRAY_SAMPLE_SIZE constant instead of hard-coded 100.0 in SizeEstimator] + + 66dac44 Tue May 21 11:41:42 2013 -0700 + Merge pull request #618 from woggling/dead-code-disttest + [DistributedSuite: remove dead code] + + 5912cc4 Fri May 17 19:58:40 2013 -0700 + Merge pull request #610 from JoshRosen/spark-747 + [Throw exception if TaskResult exceeds Akka frame size] + + 6c27c38 Thu May 16 17:33:56 2013 -0700 + Merge pull request #615 from rxin/build-fix + [Maven build fix & two other small changes] + + 2f576ab Wed May 15 18:06:24 2013 -0700 + Merge pull request #602 from rxin/shufflemerge + [Manual merge & cleanup of Shane's Shuffle Performance Optimization] + + 48c6f46 Wed May 15 10:47:19 2013 -0700 + Merge pull request #612 from ash211/patch-4 + [Docs: Mention spark shell's default for MASTER] + + 203d7b7 Wed May 15 00:47:20 2013 -0700 + Merge pull request #593 from squito/driver_ui_link + [Master UI has link to Application UI] + + 016ac86 Mon May 13 21:45:36 2013 -0700 + Merge pull request #601 from rxin/emptyrdd-master + [EmptyRDD (master branch 0.8)] + + 4b354e0 Mon May 13 17:39:19 2013 -0700 + Merge pull request #589 from mridulm/master + [Add support for instance local scheduling] + + 5dbc9b2 Sun May 12 11:03:10 2013 -0700 + Merge pull request #608 from pwendell/SPARK-738 + [SPARK-738: Spark should detect and wrap nonserializable exceptions] + + 63e1999 Fri May 10 13:54:03 2013 -0700 + Merge pull request #606 from 
markhamstra/foreachPartition_fix + [Actually use the cleaned closure in foreachPartition] + + 42bbe89 Wed May 8 22:30:31 2013 -0700 + Merge pull request #599 from JoshRosen/spark-670 + [Fix SPARK-670: EC2 'start' command should require -i option.] + + 0f1b7a0 Wed May 8 13:38:50 2013 -0700 + Merge pull request #596 from esjewett/master + [hBase example] + + 7af92f2 Sat May 4 22:29:17 2013 -0700 + Merge pull request #597 from JoshRosen/webui-fixes + [Two minor bug fixes for Spark Web UI] + + c74ce60 Sat May 4 22:26:35 2013 -0700 + Merge pull request #598 from rxin/blockmanager + [Fixed flaky unpersist test in DistributedSuite.] + + 3bf2c86 Fri May 3 18:27:30 2013 -0700 + Merge pull request #594 from shivaram/master + [Add zip partitions to Java API] + + 2484ad7 Fri May 3 17:08:55 2013 -0700 + Merge pull request #587 from rxin/blockmanager + [A set of shuffle map output related changes] + + 6fe9d4e Thu May 2 21:33:56 2013 -0700 + Merge pull request #592 from woggling/localdir-fix + [Don't accept generated local directory names that can't be created] + + 538ee75 Thu May 2 09:01:42 2013 -0700 + Merge pull request #581 from jerryshao/master + [fix [SPARK-740] block manage UI throws exception when enabling Spark Streaming] + + 9abcbcc Wed May 1 22:45:10 2013 -0700 + Merge pull request #591 from rxin/removerdd + [RDD.unpersist: probably the most desired feature of Spark] + + aa8fe1a Tue Apr 30 22:30:18 2013 -0700 + Merge pull request #586 from mridulm/master + [Pull request to address issues Reynold Xin reported] + + f708dda Tue Apr 30 07:51:40 2013 -0700 + Merge pull request #585 from pwendell/listener-perf + [[Fix SPARK-742] Task Metrics should not employ per-record timing by default] + + 68c07ea Sun Apr 28 20:19:33 2013 -0700 + Merge pull request #582 from shivaram/master + [Add zip partitions interface] + + f6ee9a8 Sun Apr 28 15:36:04 2013 -0700 + Merge pull request #583 from mridulm/master + [Fix issues with streaming test cases after yarn branch merge] + + cf54b82 
Thu Apr 25 11:45:58 2013 -0700 + Merge pull request #580 from pwendell/quickstart + [SPARK-739 Have quickstart standlone job use README] + + 118a6c7 Wed Apr 24 08:42:30 2013 -0700 + Merge pull request #575 from mridulm/master + [Manual merge of yarn branch to trunk] + + 5d8a71c Tue Apr 16 19:48:02 2013 -0700 + Merge pull request #570 from jey/increase-codecache-size + [Increase ReservedCodeCacheSize for sbt] + + ec5e553 Sun Apr 14 08:20:13 2013 -0700 + Merge pull request #558 from ash211/patch-jackson-conflict + [Don't pull in old versions of Jackson via hadoop-core] + + c1c219e Sun Apr 14 08:11:23 2013 -0700 + Merge pull request #564 from maspotts/master + [Allow latest scala in PATH, with SCALA_HOME as override (instead of vice-versa)] + + 7c10b3e Fri Apr 12 20:55:22 2013 -0700 + Merge pull request #565 from andyk/master + [Update wording of section on RDD operations in quick start guide in docs] + + 077ae0a Thu Apr 11 19:34:14 2013 -0700 + Merge pull request #561 from ash211/patch-4 + [Add details when BlockManager heartbeats time out] + + c91ff8d Wed Apr 10 15:08:23 2013 -0700 + Merge pull request #560 from ash211/patch-3 + [Typos: cluser -> cluster] + + 7cd83bf Tue Apr 9 22:07:35 2013 -0700 + Merge pull request #559 from ash211/patch-example-whitespace + [Uniform whitespace across scala examples] + + 271a4f3 Tue Apr 9 22:04:52 2013 -0700 + Merge pull request #555 from holdenk/master + [Retry failed ssh commands in the ec2 python script.] 
+ + 8ac9efb Tue Apr 9 13:50:50 2013 -0700 + Merge pull request #527 from Reinvigorate/sm-kafka-cleanup + [KafkaInputDStream fixes and improvements] + + eed54a2 Mon Apr 8 09:44:30 2013 -0700 + Merge pull request #553 from pwendell/akka-standalone + [SPARK-724 - Have Akka logging enabled by default for standalone daemons] + + b362df3 Sun Apr 7 17:17:52 2013 -0700 + Merge pull request #552 from MLnick/master + [Bumping version for Twitter Algebird to latest] + + 4b30190 Sun Apr 7 17:15:10 2013 -0700 + Merge pull request #554 from andyk/scala2.9.3 + [Fixes SPARK-723 - Update build to Scala 2.9.3] + + dfe98ca Tue Apr 2 19:24:12 2013 -0700 + Merge pull request #550 from erikvanoosten/master + [corrected Algebird example] + + b5d7830 Tue Apr 2 19:23:45 2013 -0700 + Merge pull request #551 from jey/python-bugfixes + [Python bugfixes] + + 2be2295 Sun Mar 31 18:09:14 2013 -0700 + Merge pull request #548 from markhamstra/getWritableClass_filter + [Fixed broken filter in getWritableClass[T]] + + 9831bc1 Fri Mar 29 22:16:22 2013 -0700 + Merge pull request #539 from cgrothaus/fix-webui-workdirpath + [Bugfix: WorkerWebUI must respect workDirPath from Worker] + + 3cc8ab6 Fri Mar 29 22:14:07 2013 -0700 + Merge pull request #541 from stephenh/shufflecoalesce + [Add a shuffle parameter to coalesce.] + + cad507a Fri Mar 29 22:13:12 2013 -0700 + Merge pull request #547 from jey/maven-streaming-tests-initialization-fix + [Move streaming test initialization into 'before' blocks] + + a98996d Fri Mar 29 22:12:15 2013 -0700 + Merge pull request #545 from ash211/patch-1 + [Don't use deprecated Application in example] + + 104c694 Fri Mar 29 22:11:50 2013 -0700 + Merge pull request #546 from ash211/patch-2 + [Update tuning.md] + + bc36ee4 Tue Mar 26 15:05:13 2013 -0700 + Merge pull request #543 from holdenk/master + [Re-enable deprecation warnings and fix deprecated warning.] 
+ + b8949ca Sat Mar 23 07:19:34 2013 -0700 + Merge pull request #505 from stephenh/volatile + [Make Executor fields volatile since they're read from the thread pool.] + + fd53f2f Sat Mar 23 07:13:21 2013 -0700 + Merge pull request #510 from markhamstra/WithThing + [mapWith, flatMapWith and filterWith] + + 4c5efcf Wed Mar 20 19:29:23 2013 -0700 + Merge pull request #532 from andyk/master + [SPARK-715: Adds instructions for building with Maven to documentation] + + 3558849 Wed Mar 20 19:27:47 2013 -0700 + Merge pull request #538 from rxin/cogroup + [Added mapSideCombine flag to CoGroupedRDD. Added unit test for CoGroupedRDD.] + + ca4d083 Wed Mar 20 11:22:36 2013 -0700 + Merge pull request #528 from MLnick/java-examples + [[SPARK-707] Adding Java versions of Pi, LogQuery and K-Means examples] + + b812e6b Wed Mar 20 11:21:02 2013 -0700 + Merge pull request #526 from markhamstra/foldByKey + [Add foldByKey] + + 945d1e7 Tue Mar 19 21:59:06 2013 -0700 + Merge pull request #536 from sasurfer/master + [CoalescedRDD for many partitions] + + 1cbbe94 Tue Mar 19 21:34:34 2013 -0700 + Merge pull request #534 from stephenh/removetrycatch + [Remove try/catch block that can't be hit.] + + 71e53f8 Tue Mar 19 21:31:41 2013 -0700 + Merge pull request #537 from wishbear/configurableInputFormat + [call setConf from input format if it is Configurable] + + c1e9cdc Sat Mar 16 11:47:45 2013 -0700 + Merge pull request #525 from stephenh/subtractByKey + [Add PairRDDFunctions.subtractByKey.] + + cdbfd1e Fri Mar 15 15:13:28 2013 -0700 + Merge pull request #516 from squito/fix_local_metrics + [Fix local metrics] + + f9fa2ad Fri Mar 15 15:12:43 2013 -0700 + Merge pull request #530 from mbautin/master-update-log4j-and-make-compile-in-IntelliJ + [Add a log4j compile dependency to fix build in IntelliJ] + + 4032beb Wed Mar 13 19:29:46 2013 -0700 + Merge pull request #521 from stephenh/earlyclose + [Close the reader in HadoopRDD as soon as iteration end.] 
+ + 3c97276 Wed Mar 13 19:25:08 2013 -0700 + Merge pull request #524 from andyk/master + [Fix broken link to YARN documentation] + + 1c3d981 Wed Mar 13 19:23:48 2013 -0700 + Merge pull request #517 from Reinvigorate/sm-build-fixes + [Build fixes for streaming /w SBT] + + 2d477fd Wed Mar 13 06:49:16 2013 -0700 + Merge pull request #523 from andyk/master + [Fix broken link in Quick Start] + + 00c4d23 Tue Mar 12 22:19:00 2013 -0700 + Merge pull request #518 from woggling/long-bm-sizes + [Send block sizes as longs in BlockManager updates] + + cbf8f0d Mon Mar 11 00:23:57 2013 -0700 + Merge pull request #513 from MLnick/bagel-caching + [Adds choice of persistence level to Bagel.] + + 91a9d09 Sun Mar 10 15:48:23 2013 -0700 + Merge pull request #512 from patelh/fix-kryo-serializer + [Fix reference bug in Kryo serializer, add test, update version] + + 557cfd0 Sun Mar 10 15:44:57 2013 -0700 + Merge pull request #515 from woggling/deploy-app-death + [Notify standalone deploy client of application death.] + + 04fb81f Sun Mar 3 17:20:07 2013 -0800 + Merge pull request #506 from rxin/spark-706 + [Fixed SPARK-706: Failures in block manager put leads to read task hanging.] + + 6cf4be4 Sun Mar 3 17:16:22 2013 -0800 + Merge pull request #462 from squito/stageInfo + [Track assorted metrics for each task, report summaries to user at stage completion] + + 6bfc7ca Sat Mar 2 22:14:49 2013 -0800 + Merge pull request #504 from mosharaf/master + [Worker address was getting removed when removing an app.] 
+ + 94b3db1 Sat Mar 2 22:13:52 2013 -0800 + Merge pull request #508 from markhamstra/TestServerInUse + [Avoid bind failure in InputStreamsSuite] + + 25c71d3 Fri Mar 1 08:00:18 2013 -0800 + Merge pull request #507 from markhamstra/poms271 + [bump version to 0.7.1-SNAPSHOT in the subproject poms] + diff --git a/dev/create-release/generate-changelist.py b/dev/create-release/generate-changelist.py index 2e1a35a629..916ec90f05 100755 --- a/dev/create-release/generate-changelist.py +++ b/dev/create-release/generate-changelist.py @@ -31,8 +31,8 @@ import time import traceback SPARK_HOME = os.environ["SPARK_HOME"] -NEW_RELEASE_VERSION = "1.0.0" -PREV_RELEASE_GIT_TAG = "v0.9.1" +NEW_RELEASE_VERSION = "1.1.0" +PREV_RELEASE_GIT_TAG = "v1.0.0" CHANGELIST = "CHANGES.txt" OLD_CHANGELIST = "%s.old" % (CHANGELIST) -- cgit v1.2.3