about | summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
-rw-r--r-- CHANGES.txt 14470
-rwxr-xr-x dev/create-release/generate-changelist.py 4
2 files changed, 14472 insertions, 2 deletions
diff --git a/CHANGES.txt b/CHANGES.txt
new file mode 100644
index 0000000000..6efb022574
--- /dev/null
+++ b/CHANGES.txt
@@ -0,0 +1,14470 @@
+Spark Change Log
+----------------
+
+Release 1.1.0
+
+ Add line continuation for script to work w/ py2.7.5
+ Matthew Farrellee <matt@redhat.com>
+ 2014-08-27 15:50:30 -0700
+ Commit: d4cf7a0, github.com/apache/spark/pull/2139
+
+ [SPARK-3235][SQL] Ensure in-memory tables don't always broadcast.
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-27 15:14:08 -0700
+ Commit: 9a62cf3, github.com/apache/spark/pull/2147
+
+ [SPARK-3065][SQL] Add locale setting to fix results do not match for udf_unix_timestamp format "yyyy MMM dd h:mm:ss a" run with not "America/Los_Angeles" TimeZone in HiveCompatibilitySuite
+ luogankun <luogankun@gmail.com>
+ 2014-08-27 15:08:22 -0700
+ Commit: 5ea260e, github.com/apache/spark/pull/1968
+
+ [SQL] [SPARK-3236] Reading Parquet tables from Metastore mangles location
+ Aaron Davidson <aaron@databricks.com>
+ 2014-08-27 15:05:47 -0700
+ Commit: 7711687, github.com/apache/spark/pull/2150
+
+ [SPARK-3252][SQL] Add missing condition for test
+ viirya <viirya@gmail.com>
+ 2014-08-27 14:55:05 -0700
+ Commit: b3d763b, github.com/apache/spark/pull/2159
+
+ [SPARK-3243] Don't use stale spark-driver.* system properties
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-27 14:46:56 -0700
+ Commit: c1ffa3e, github.com/apache/spark/pull/2154
+
+ Spark-3213 Fixes issue with spark-ec2 not detecting slaves created with "Launch More like this"
+ Vida Ha <vida@databricks.com>
+ 2014-08-27 14:26:06 -0700
+ Commit: 3cb4e17, github.com/apache/spark/pull/2163
+
+ [SPARK-3138][SQL] sqlContext.parquetFile should be able to take a single file as parameter
+ chutium <teng.qiu@gmail.com>
+ 2014-08-27 13:13:04 -0700
+ Commit: 90f8f3e, github.com/apache/spark/pull/2044
+
+ [SPARK-3197] [SQL] Reduce the Expression tree object creations for aggregation function (min/max)
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-08-27 12:50:47 -0700
+ Commit: 4c7f082, github.com/apache/spark/pull/2113
+
+ [SPARK-3118][SQL]add "SHOW TBLPROPERTIES tblname;" and "SHOW COLUMNS (FROM|IN) table_name [(FROM|IN) db_name]" support
+ u0jing <u9jing@gmail.com>
+ 2014-08-27 12:47:14 -0700
+ Commit: 19cda07, github.com/apache/spark/pull/2034
+
+ SPARK-3259 - User data should be given to the master
+ Allan Douglas R. de Oliveira <allan@chaordicsystems.com>
+ 2014-08-27 12:43:22 -0700
+ Commit: 0c94a5b, github.com/apache/spark/pull/2162
+
+ [SPARK-2608][Core] Fixed command line option passing issue over Mesos via SPARK_EXECUTOR_OPTS
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-27 12:39:21 -0700
+ Commit: 935bffe, github.com/apache/spark/pull/2161
+
+ [SPARK-3239] [PySpark] randomize the dirs for each process
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-27 10:40:35 -0700
+ Commit: 092121e, github.com/apache/spark/pull/2152
+
+ [SPARK-3170][CORE][BUG]:RDD info loss in "StorageTab" and "ExecutorTab"
+ uncleGen <hustyugm@gmail.com>
+ 2014-08-27 10:32:13 -0700
+ Commit: 8f8e2a4, github.com/apache/spark/pull/2131
+
+ [SPARK-3154][STREAMING] Make FlumePollingInputDStream shutdown cleaner.
+ Hari Shreedharan <hshreedharan@apache.org>
+ 2014-08-27 02:39:02 -0700
+ Commit: 1d468df, github.com/apache/spark/pull/2065
+
+ [SPARK-3227] [mllib] Added migration guide for v1.0 to v1.1
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-27 01:45:59 -0700
+ Commit: 7286d57, github.com/apache/spark/pull/2146
+
+ [SPARK-2830][MLLIB] doc update for 1.1
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-27 01:19:48 -0700
+ Commit: 7401247, github.com/apache/spark/pull/2151
+
+ [SPARK-3237][SQL] Fix parquet filters with UDFs
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-27 00:59:23 -0700
+ Commit: ca01de1, github.com/apache/spark/pull/2153
+
+ [SPARK-3139] Made ContextCleaner to not block on shuffles
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-08-27 00:13:38 -0700
+ Commit: 5cf1e44, github.com/apache/spark/pull/2143
+
+ HOTFIX: Minor typo in conf template
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-26 23:40:50 -0700
+ Commit: 6f82a4b
+
+ [SPARK-3167] Handle special driver configs in Windows (Branch 1.1)
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-26 23:06:11 -0700
+ Commit: e7672f1, github.com/apache/spark/pull/2156
+
+ [SPARK-3224] FetchFailed reduce stages should only show up once in failed stages (in UI)
+ Reynold Xin <rxin@apache.org>, Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-08-26 21:59:48 -0700
+ Commit: 2381e90, github.com/apache/spark/pull/2127
+
+ Fix unclosed HTML tag in Yarn docs.
+ Josh Rosen <joshrosen@apache.org>
+ 2014-08-26 18:55:00 -0700
+ Commit: 7726e56
+
+ [SPARK-3036][SPARK-3037][SQL] Add MapType/ArrayType containing null value support to Parquet.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-08-26 18:28:41 -0700
+ Commit: 8b5af6f, github.com/apache/spark/pull/2032
+
+ [Docs] Run tests like in contributing guide
+ nchammas <nicholas.chammas@gmail.com>
+ 2014-08-26 17:50:04 -0700
+ Commit: 0d97233, github.com/apache/spark/pull/2149
+
+ [SPARK-2964] [SQL] Remove duplicated code from spark-sql and start-thriftserver.sh
+ Cheng Lian <lian.cs.zju@gmail.com>, Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-26 17:33:40 -0700
+ Commit: c0e1f99, github.com/apache/spark/pull/1886
+
+ [SPARK-3194][SQL] Add AttributeSet to fix bugs with invalid comparisons of AttributeReferences
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-26 16:29:14 -0700
+ Commit: a308a16, github.com/apache/spark/pull/2109
+
+ [SPARK-2839][MLlib] Stats Toolkit documentation updated
+ Burak <brkyvz@gmail.com>
+ 2014-08-26 15:18:42 -0700
+ Commit: 2715eb7, github.com/apache/spark/pull/2130
+
+ [SPARK-3226][MLLIB] doc update for native libraries
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-26 15:12:27 -0700
+ Commit: 5ff9000, github.com/apache/spark/pull/2128
+
+ [SPARK-3063][SQL] ExistingRdd should convert Map to catalyst Map.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-08-26 15:04:08 -0700
+ Commit: 5d981a4, github.com/apache/spark/pull/1963
+
+ [SPARK-2969][SQL] Make ScalaReflection be able to handle ArrayType.containsNull and MapType.valueContainsNull.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-08-26 13:22:55 -0700
+ Commit: 35a5853, github.com/apache/spark/pull/1889
+
+ [SPARK-2871] [PySpark] add histogram() API
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-26 13:04:30 -0700
+ Commit: 83d2730, github.com/apache/spark/pull/2091
+
+ [SPARK-3131][SQL] Allow user to set parquet compression codec for writing ParquetFile in SQLContext
+ chutium <teng.qiu@gmail.com>
+ 2014-08-26 11:51:26 -0700
+ Commit: 3a9d874, github.com/apache/spark/pull/2039
+
+ [SPARK-2886] Use more specific actor system name than "spark"
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-25 23:36:09 -0700
+ Commit: 0f947f1, github.com/apache/spark/pull/1810
+
+ [Spark-3222] [SQL] Cross join support in HiveQL
+ Daoyuan Wang <daoyuan.wang@intel.com>, adrian-wang <daoyuanwong@gmail.com>
+ 2014-08-25 22:56:35 -0700
+ Commit: 48a0749, github.com/apache/spark/pull/2124
+
+ SPARK-2481: The environment variables SPARK_HISTORY_OPTS is covered in spark-env.sh
+ witgo <witgo@qq.com>, GuoQiang Li <witgo@qq.com>
+ 2014-08-25 19:22:27 -0700
+ Commit: 4d6a0e9, github.com/apache/spark/pull/1341
+
+ [SPARK-3011][SQL] _temporary directory should be filtered out by sqlContext.parquetFile
+ Chia-Yung Su <chiayung@appier.com>
+ 2014-08-25 18:20:19 -0700
+ Commit: b5dc9b4, github.com/apache/spark/pull/1959
+
+ [SQL] logWarning should be logInfo in getResultSetSchema
+ wangfei <wangfei_hello@126.com>
+ 2014-08-25 17:46:43 -0700
+ Commit: 957b356, github.com/apache/spark/pull/1939
+
+ [SPARK-3058] [SQL] Support EXTENDED for EXPLAIN
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-08-25 17:43:56 -0700
+ Commit: f8ac8ed, github.com/apache/spark/pull/1962
+
+ [SPARK-2929][SQL] Refactored Thrift server and CLI suites
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-25 16:29:59 -0700
+ Commit: 292f28d, github.com/apache/spark/pull/1856
+
+ [SPARK-3204][SQL] MaxOf would be foldable if both left and right are foldable.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-08-25 16:27:00 -0700
+ Commit: 19b01d6, github.com/apache/spark/pull/2116
+
+ Fixed a typo in docs/running-on-mesos.md
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-25 14:56:51 -0700
+ Commit: 8d33a6d, github.com/apache/spark/pull/2119
+
+ [FIX] fix error message in sendMessageReliably
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-25 14:55:20 -0700
+ Commit: d892062, github.com/apache/spark/pull/2120
+
+ SPARK-2798 [BUILD] Correct several small errors in Flume module pom.xml files
+ Sean Owen <sowen@cloudera.com>
+ 2014-08-25 13:29:07 -0700
+ Commit: ff616fd, github.com/apache/spark/pull/1726
+
+ [SPARK-2495][MLLIB] make KMeans constructor public
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-25 12:30:02 -0700
+ Commit: 69a17f1, github.com/apache/spark/pull/2112
+
+ [SPARK-2871] [PySpark] add zipWithIndex() and zipWithUniqueId()
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-24 21:16:05 -0700
+ Commit: b82da3d, github.com/apache/spark/pull/2092
+
+ [MLlib][SPARK-2997] Update SVD documentation to reflect roughly square
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-08-24 17:35:54 -0700
+ Commit: 749bddc, github.com/apache/spark/pull/2070
+
+ [SPARK-2841][MLlib] Documentation for feature transformations
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-08-24 17:33:33 -0700
+ Commit: a4db81a, github.com/apache/spark/pull/2068
+
+ [SPARK-3192] Some scripts have 2 space indentation but other scripts have 4 space indentation.
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-24 09:43:44 -0700
+ Commit: ce14cd1, github.com/apache/spark/pull/2104
+
+ [SPARK-2967][SQL] Follow-up: Also copy hash expressions in sort based shuffle fix.
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-23 16:21:08 -0700
+ Commit: e23f0bc, github.com/apache/spark/pull/2072
+
+ [SPARK-2554][SQL] CountDistinct partial aggregation and object allocation improvements
+ Michael Armbrust <michael@databricks.com>, Gregory Owen <greowen@gmail.com>
+ 2014-08-23 16:19:10 -0700
+ Commit: 7112da8, github.com/apache/spark/pull/1935
+
+ [SQL] Make functionRegistry in HiveContext transient.
+ Yin Huai <huaiyin.thu@gmail.com>
+ 2014-08-23 12:46:41 -0700
+ Commit: 9309786, github.com/apache/spark/pull/2074
+
+ [SPARK-2963] REGRESSION - The description about how to build for using CLI and Thrift JDBC server is absent in proper document -
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-22 22:28:05 -0700
+ Commit: 5689660, github.com/apache/spark/pull/2080
+
+ [SPARK-3169] Removed dependency on spark streaming test from spark flume sink
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-08-22 21:34:48 -0700
+ Commit: cd73631, github.com/apache/spark/pull/2101
+
+ Revert "HOTFIX:Temporarily removing flume sink test in 1.1 branch"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-22 21:31:52 -0700
+ Commit: 385c4f2
+
+ [SPARK-2840] [mllib] DecisionTree doc update (Java, Python examples)
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-21 00:17:29 -0700
+ Commit: 1e5d9cb, github.com/apache/spark/pull/2063
+
+ BUILD: Bump Hadoop versions in the release build.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-20 12:18:41 -0700
+ Commit: da0a701
+
+ HOTFIX:Temporarily removing flume sink test in 1.1 branch
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-20 22:24:22 -0700
+ Commit: 1d5e84a
+
+ [HOTFIX][STREAMING] Allow the JVM/Netty to decide which port to bind to in Flume Polling Tests.
+ Hari Shreedharan <harishreedharan@gmail.com>
+ 2014-08-17 19:50:31 -0700
+ Commit: 4485665, github.com/apache/spark/pull/1820
+
+ [HOTFIX][Streaming] Handle port collisions in flume polling test
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-06 16:34:53 -0700
+ Commit: 3f91e9d, github.com/apache/spark/pull/1803
+
+ [SPARK-2843][MLLIB] add a section about regularization parameter in ALS
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-20 17:47:39 -0700
+ Commit: eba399b, github.com/apache/spark/pull/2064
+
+ [SPARK-3143][MLLIB] add tf-idf user guide
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-20 17:41:36 -0700
+ Commit: 1af68ca, github.com/apache/spark/pull/2061
+
+ [SPARK-3140] Clarify confusing PySpark exception message
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-20 17:07:39 -0700
+ Commit: f8bcb12, github.com/apache/spark/pull/2067
+
+ [SPARK-2298] Encode stage attempt in SparkListener & UI.
+ Reynold Xin <rxin@apache.org>
+ 2014-08-20 15:37:27 -0700
+ Commit: dc05282, github.com/apache/spark/pull/1545
+
+ [SPARK-2169] Don't copy appName / basePath everywhere.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-08-18 13:25:30 -0700
+ Commit: 2c1683e, github.com/apache/spark/pull/1252
+
+ [SPARK-2846][SQL] Add configureInputJobPropertiesForStorageHandler to initialization of job conf
+ Alex Liu <alex_liu68@yahoo.com>
+ 2014-08-20 16:14:06 -0700
+ Commit: 64e136a, github.com/apache/spark/pull/1927
+
+ SPARK_LOGFILE and SPARK_ROOT_LOGGER are no longer needed in spark-daemon.sh
+ wangfei <wangfei_hello@126.com>
+ 2014-08-20 16:00:46 -0700
+ Commit: 5f72d7b, github.com/apache/spark/pull/2057
+
+ [SPARK-2967][SQL] Fix sort based shuffle for spark sql.
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-20 15:51:14 -0700
+ Commit: 311831d, github.com/apache/spark/pull/2066
+
+ [SPARK-2849] Handle driver configs separately in client mode
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-20 15:01:47 -0700
+ Commit: beb705a, github.com/apache/spark/pull/1845
+
+ [SPARK-3149] Connection establishment information is not enough.
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-20 14:04:39 -0700
+ Commit: 25b01fd, github.com/apache/spark/pull/2060
+
+ [SPARK-3062] [SPARK-2970] [SQL] spark-sql script ends with IOException when EventLogging is enabled
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-20 13:26:11 -0700
+ Commit: 5095851, github.com/apache/spark/pull/1970
+
+ [SPARK-3126][SPARK-3127][SQL] Fixed HiveThriftServer2Suite
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-20 12:57:39 -0700
+ Commit: 99ca704, github.com/apache/spark/pull/2036
+
+ SPARK-3092 [SQL]: Always include the thriftserver when -Phive is enabled.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-20 12:13:31 -0700
+ Commit: ca7322d, github.com/apache/spark/pull/2006
+
+ [SPARK-3054][STREAMING] Add unit tests for Spark Sink.
+ Hari Shreedharan <hshreedharan@apache.org>, Hari Shreedharan <hshreedharan@cloudera.com>
+ 2014-08-20 04:09:54 -0700
+ Commit: 9b29099, github.com/apache/spark/pull/1958
+
+ [SPARK-3141] [PySpark] fix sortByKey() with take()
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-19 22:43:49 -0700
+ Commit: 5b22ebf, github.com/apache/spark/pull/2045
+
+ [DOCS] Fixed wrong links
+ Ken Takagiwa <ugw.gi.world@gmail.com>
+ 2014-08-19 22:43:22 -0700
+ Commit: f8c908e, github.com/apache/spark/pull/2042
+
+ [SPARK-2974] [SPARK-2975] Fix two bugs related to spark.local.dirs
+ Josh Rosen <joshrosen@apache.org>
+ 2014-08-19 22:42:50 -0700
+ Commit: 5d1a878, github.com/apache/spark/pull/2002
+
+ [SPARK-3142][MLLIB] output shuffle data directly in Word2Vec
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-19 22:16:22 -0700
+ Commit: a5bc9c6, github.com/apache/spark/pull/2049
+
+ [SPARK-3119] Re-implementation of TorrentBroadcast.
+ Reynold Xin <rxin@apache.org>
+ 2014-08-19 22:11:13 -0700
+ Commit: 08c9973, github.com/apache/spark/pull/2030
+
+ [HOTFIX][Streaming][MLlib] use temp folder for checkpoint
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-19 22:05:29 -0700
+ Commit: d5db95b, github.com/apache/spark/pull/2046
+
+ [SPARK-3130][MLLIB] detect negative values in naive Bayes
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-19 21:01:23 -0700
+ Commit: 148e45b, github.com/apache/spark/pull/2038
+
+ [SQL] add note of use synchronizedMap in SQLConf
+ wangfei <wangfei_hello@126.com>, scwf <wangfei1@huawei.com>
+ 2014-08-19 19:37:02 -0700
+ Commit: 607735c, github.com/apache/spark/pull/1996
+
+ [SPARK-3112][MLLIB] Add documentation and example for StreamingLR
+ freeman <the.freeman.lab@gmail.com>
+ 2014-08-19 18:07:42 -0700
+ Commit: d75464d, github.com/apache/spark/pull/2047
+
+ [MLLIB] minor update to word2vec
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-19 17:41:37 -0700
+ Commit: 023ed7c, github.com/apache/spark/pull/2043
+
+ [SPARK-2468] Netty based block server / client module
+ Reynold Xin <rxin@apache.org>
+ 2014-08-19 17:40:35 -0700
+ Commit: 66b4c81, github.com/apache/spark/pull/1971
+
+ [SPARK-3136][MLLIB] Create Java-friendly methods in RandomRDDs
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-19 16:06:48 -0700
+ Commit: d371c71, github.com/apache/spark/pull/2041
+
+ [SPARK-2790] [PySpark] fix zip with serializers which have different batch sizes.
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-19 14:46:32 -0700
+ Commit: 3540d4b, github.com/apache/spark/pull/1894
+
+ Move a bracket in validateSettings of SparkConf
+ hzw19900416 <carlmartinmax@gmail.com>
+ 2014-08-19 14:04:49 -0700
+ Commit: f6b4ab8, github.com/apache/spark/pull/2012
+
+ SPARK-2333 - spark_ec2 script should allow option for existing security group
+ Vida Ha <vida@databricks.com>
+ 2014-08-19 13:35:05 -0700
+ Commit: c3952b0, github.com/apache/spark/pull/1899
+
+ [SPARK-3128][MLLIB] Use streaming test suite for StreamingLR
+ freeman <the.freeman.lab@gmail.com>
+ 2014-08-19 13:28:57 -0700
+ Commit: 04a3208, github.com/apache/spark/pull/2037
+
+ [SPARK-3089] Fix meaningless error message in ConnectionManager
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-19 10:15:11 -0700
+ Commit: 5d895ad, github.com/apache/spark/pull/2000
+
+ [SPARK-3072] YARN - Exit when reach max number failed executors
+ Thomas Graves <tgraves@apache.org>
+ 2014-08-19 09:40:31 -0500
+ Commit: 1418893, github.com/apache/spark/pull/2022
+
+ Fix typo in decision tree docs
+ Matt Forbes <matt@tellapart.com>
+ 2014-08-18 21:43:32 -0700
+ Commit: f3b0f34, github.com/apache/spark/pull/1837
+
+ [SPARK-3116] Remove the excessive lockings in TorrentBroadcast
+ Reynold Xin <rxin@apache.org>
+ 2014-08-18 20:51:41 -0700
+ Commit: b6d8e66, github.com/apache/spark/pull/2028
+
+ [SPARK-3114] [PySpark] Fix Python UDFs in Spark SQL.
+ Josh Rosen <joshrosen@apache.org>, Davies Liu <davies.liu@gmail.com>
+ 2014-08-18 20:42:19 -0700
+ Commit: 3a03259, github.com/apache/spark/pull/2026
+
+ [SPARK-3108][MLLIB] add predictOnValues to StreamingLR and fix predictOn
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-18 18:20:54 -0700
+ Commit: 7d069bf, github.com/apache/spark/pull/2023
+
+ [SPARK-2850] [SPARK-2626] [mllib] MLlib stats examples + small fixes
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-18 18:01:39 -0700
+ Commit: e3f89e9, github.com/apache/spark/pull/1878
+
+ [mllib] DecisionTree: treeAggregate + Python example bug fix
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-18 14:40:05 -0700
+ Commit: 98778ff, github.com/apache/spark/pull/2015
+
+ [SPARK-2718] [yarn] Handle quotes and other characters in user args.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-08-18 14:10:10 -0700
+ Commit: 25cabd7, github.com/apache/spark/pull/1724
+
+ [SPARK-3103] [PySpark] fix saveAsTextFile() with utf-8
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-18 13:58:35 -0700
+ Commit: e083334, github.com/apache/spark/pull/2018
+
+ [SPARK-2406][SQL] Initial support for using ParquetTableScan to read HiveMetaStore tables.
+ Michael Armbrust <michael@databricks.com>, Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-18 13:17:10 -0700
+ Commit: cc4015d, github.com/apache/spark/pull/1819
+
+ [SPARK-3091] [SQL] Add support for caching metadata on Parquet files
+ Matei Zaharia <matei@databricks.com>
+ 2014-08-18 11:00:10 -0700
+ Commit: 2ae2857, github.com/apache/spark/pull/2005
+
+ SPARK-3025 [SQL]: Allow JDBC clients to set a fair scheduler pool
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-18 10:52:20 -0700
+ Commit: 496f62d, github.com/apache/spark/pull/1937
+
+ [SPARK-3085] [SQL] Use compact data structures in SQL joins
+ Matei Zaharia <matei@databricks.com>
+ 2014-08-18 10:45:24 -0700
+ Commit: 4da76fc, github.com/apache/spark/pull/1993
+
+ [SPARK-3084] [SQL] Collect broadcasted tables in parallel in joins
+ Matei Zaharia <matei@databricks.com>
+ 2014-08-18 10:05:52 -0700
+ Commit: 55e9dd6, github.com/apache/spark/pull/1990
+
+ SPARK-3096: Include parquet hive serde by default in build
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-18 10:00:46 -0700
+ Commit: ec0b91e, github.com/apache/spark/pull/2009
+
+ [SPARK-2862] histogram method fails on some choices of bucketCount
+ Chandan Kumar <chandan.kumar@imaginea.com>
+ 2014-08-18 09:52:25 -0700
+ Commit: 12f16ba, github.com/apache/spark/pull/1787
+
+ [MLlib] Remove transform(dataset: RDD[String]) from Word2Vec public API
+ Liquan Pei <liquanpei@gmail.com>
+ 2014-08-18 01:15:45 -0700
+ Commit: e0bc333, github.com/apache/spark/pull/2010
+
+ [SPARK-2842][MLlib]Word2Vec documentation
+ Liquan Pei <liquanpei@gmail.com>
+ 2014-08-17 23:30:47 -0700
+ Commit: 518258f, github.com/apache/spark/pull/2003
+
+ [SPARK-3097][MLlib] Word2Vec performance improvement
+ Liquan Pei <liquanpei@gmail.com>
+ 2014-08-17 23:29:44 -0700
+ Commit: 708cde9, github.com/apache/spark/pull/1932
+
+ SPARK-2900. aggregate inputBytes per stage
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-08-17 22:39:06 -0700
+ Commit: 0506539, github.com/apache/spark/pull/1826
+
+ SPARK-2884: Create binary builds in parallel with release script.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-17 22:29:58 -0700
+ Commit: a5ae720
+
+ [SPARK-3087][MLLIB] fix col indexing bug in chi-square and add a check for number of distinct values
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-17 20:53:18 -0700
+ Commit: 8438daf, github.com/apache/spark/pull/1997
+
+ [SPARK-1981] updated streaming-kinesis.md
+ Chris Fregly <chris@fregly.com>
+ 2014-08-17 19:33:15 -0700
+ Commit: 8263567, github.com/apache/spark/pull/1757
+
+ [SQL] Improve debug logging and toStrings.
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-17 19:00:38 -0700
+ Commit: 4f776df, github.com/apache/spark/pull/2004
+
+ Revert "[SPARK-2970] [SQL] spark-sql script ends with IOException when EventLogging is enabled"
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-17 18:10:45 -0700
+ Commit: c6a0091, github.com/apache/spark/pull/2007
+
+ SPARK-2881: Upgrade to Snappy 1.0.5.3 to avoid SPARK-2881.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-17 15:48:39 -0700
+ Commit: d411f41, github.com/apache/spark/pull/1999
+
+ [SPARK-3042] [mllib] DecisionTree Filter top-down instead of bottom-up
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-16 23:53:14 -0700
+ Commit: 91af120, github.com/apache/spark/pull/1975
+
+ [SPARK-3077][MLLIB] fix some chisq-test
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-16 21:16:27 -0700
+ Commit: 413a329, github.com/apache/spark/pull/1982
+
+ In the stop method of ConnectionManager to cancel the ackTimeoutMonitor
+ GuoQiang Li <witgo@qq.com>
+ 2014-08-16 20:05:55 -0700
+ Commit: f02e327, github.com/apache/spark/pull/1989
+
+ [SPARK-1065] [PySpark] improve supporting for large broadcast
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-16 16:59:34 -0700
+ Commit: 5dd571c, github.com/apache/spark/pull/1912
+
+ [SPARK-3035] Wrong example with SparkContext.addFile
+ iAmGhost <kdh7807@gmail.com>
+ 2014-08-16 16:48:38 -0700
+ Commit: 721f2fd, github.com/apache/spark/pull/1942
+
+ [SPARK-3081][MLLIB] rename RandomRDDGenerators to RandomRDDs
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-16 15:14:43 -0700
+ Commit: a12d3ae, github.com/apache/spark/pull/1979
+
+ [SPARK-3048][MLLIB] add LabeledPoint.parse and remove loadStreamingLabeledPoints
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-16 15:13:34 -0700
+ Commit: 0b354be, github.com/apache/spark/pull/1952
+
+ [SPARK-2677] BasicBlockFetchIterator#next can wait forever
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-16 14:15:58 -0700
+ Commit: bd3ce2f, github.com/apache/spark/pull/1632
+
+ [SQL] Using safe floating-point numbers in doctest
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-16 11:26:51 -0700
+ Commit: 8c79574, github.com/apache/spark/pull/1925
+
+ [SPARK-2977] Ensure ShuffleManager is created before ShuffleBlockManager
+ Josh Rosen <joshrosen@apache.org>
+ 2014-08-16 00:04:55 -0700
+ Commit: 0e0ec2e, github.com/apache/spark/pull/1976
+
+ [SPARK-3045] Make Serializer interface Java friendly
+ Reynold Xin <rxin@apache.org>
+ 2014-08-15 23:12:34 -0700
+ Commit: fcf30cd, github.com/apache/spark/pull/1948
+
+ [SPARK-3015] Block on cleaning tasks to prevent Akka timeouts
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-15 22:55:32 -0700
+ Commit: 2541537, github.com/apache/spark/pull/1931
+
+ [SPARK-3001][MLLIB] Improve Spearman's correlation
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-15 21:07:55 -0700
+ Commit: ce06d7f, github.com/apache/spark/pull/1917
+
+ [SPARK-3078][MLLIB] Make LRWithLBFGS API consistent with others
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-15 21:04:29 -0700
+ Commit: c085011, github.com/apache/spark/pull/1973
+
+ [SPARK-3046] use executor's class loader as the default serializer classloader
+ Reynold Xin <rxin@apache.org>
+ 2014-08-15 17:04:15 -0700
+ Commit: 077213b, github.com/apache/spark/pull/1972
+
+ [SPARK-3022] [SPARK-3041] [mllib] Call findBins once per level + unordered feature bug fix
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-15 14:50:10 -0700
+ Commit: 407ea9f, github.com/apache/spark/pull/1950
+
+ SPARK-3028. sparkEventToJson should support SparkListenerExecutorMetrics...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-08-15 11:35:08 -0700
+ Commit: 63376a0, github.com/apache/spark/pull/1961
+
+ Revert "[SPARK-2468] Netty based block server / client module"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-15 09:01:35 -0700
+ Commit: b066af4
+
+ [SPARK-2924] remove default args to overloaded methods
+ Anand Avati <avati@redhat.com>
+ 2014-08-15 08:53:52 -0700
+ Commit: debb3e3, github.com/apache/spark/pull/1704
+
+ [SPARK-2468] Netty based block server / client module
+ Reynold Xin <rxin@apache.org>
+ 2014-08-14 19:01:33 -0700
+ Commit: 3f23d2a, github.com/apache/spark/pull/1907
+
+ [SPARK-2936] Migrate Netty network module from Java to Scala
+ Reynold Xin <rxin@apache.org>
+ 2014-08-10 20:36:54 -0700
+ Commit: d3cce58, github.com/apache/spark/pull/1865
+
+ [SPARK-2736] PySpark converter and example script for reading Avro files
+ Kan Zhang <kzhang@apache.org>
+ 2014-08-14 19:03:51 -0700
+ Commit: 72e730e, github.com/apache/spark/pull/1916
+
+ [SPARK-3027] TaskContext: tighten visibility and provide Java friendly callback API
+ Reynold Xin <rxin@apache.org>
+ 2014-08-14 18:37:02 -0700
+ Commit: f99e4fc, github.com/apache/spark/pull/1938
+
+ Make dev/mima runnable on Mac OS X.
+ Reynold Xin <rxin@apache.org>
+ 2014-08-14 16:27:11 -0700
+ Commit: 475a35b, github.com/apache/spark/pull/1953
+
+ SPARK-3009: Reverted readObject method in ApplicationInfo so that Applic...
+ Jacek Lewandowski <lewandowski.jacek@gmail.com>
+ 2014-08-14 15:01:39 -0700
+ Commit: f5d9176, github.com/apache/spark/pull/1947
+
+ Revert [SPARK-3011][SQL] _temporary directory should be filtered out by sqlContext.parquetFile
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-14 13:00:21 -0700
+ Commit: c39a3f3, github.com/apache/spark/pull/1949
+
+ [SPARK-2979][MLlib] Improve the convergence rate by minimizing the condition number
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-08-14 11:56:13 -0700
+ Commit: dc8ef93, github.com/apache/spark/pull/1897
+
+ Minor cleanup of metrics.Source
+ Reynold Xin <rxin@apache.org>
+ 2014-08-14 11:22:41 -0700
+ Commit: a3dc54f, github.com/apache/spark/pull/1943
+
+ [SPARK-2925] [sql]fix spark-sql and start-thriftserver shell bugs when set --driver-java-options
+ wangfei <wangfei_hello@126.com>, wangfei <wangfei1@huawei.com>
+ 2014-08-14 10:55:51 -0700
+ Commit: df25acd, github.com/apache/spark/pull/1851
+
+ [SQL] Python JsonRDD UTF8 Encoding Fix
+ Ahir Reddy <ahirreddy@gmail.com>
+ 2014-08-14 10:48:52 -0700
+ Commit: 850abaa, github.com/apache/spark/pull/1914
+
+ [SPARK-2927][SQL] Add a conf to configure if we always read Binary columns stored in Parquet as String columns
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-14 10:46:33 -0700
+ Commit: de501e1, github.com/apache/spark/pull/1855
+
+ [SPARK-3011][SQL] _temporary directory should be filtered out by sqlContext.parquetFile
+ Chia-Yung Su <chiayung@appier.com>
+ 2014-08-14 10:43:08 -0700
+ Commit: 221c84e, github.com/apache/spark/pull/1924
+
+ SPARK-2893: Do not swallow Exceptions when running a custom kryo registrator
+ Graham Dennis <graham.dennis@gmail.com>
+ 2014-08-14 02:24:18 -0700
+ Commit: af809de, github.com/apache/spark/pull/1827
+
+ [SPARK-3029] Disable local execution of Spark jobs by default
+ Aaron Davidson <aaron@databricks.com>
+ 2014-08-14 01:37:38 -0700
+ Commit: 0cb2b82, github.com/apache/spark/pull/1321
+
+ [SPARK-2995][MLLIB] add ALS.setIntermediateRDDStorageLevel
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-13 23:53:44 -0700
+ Commit: 1baf06f, github.com/apache/spark/pull/1913
+
+ [Docs] Add missing <code> tags (minor)
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-13 23:24:23 -0700
+ Commit: bf7c6e1, github.com/apache/spark/pull/1936
+
+ [SPARK-3006] Failed to execute spark-shell in Windows OS
+ Masayoshi TSUZUKI <tsudukim@oss.nttdata.co.jp>
+ 2014-08-13 22:17:07 -0700
+ Commit: dcd99c3, github.com/apache/spark/pull/1918
+
+ SPARK-3020: Print completed indices rather than tasks in web UI
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-13 18:08:38 -0700
+ Commit: c6cb55a, github.com/apache/spark/pull/1933
+
+ [SPARK-2986] [SQL] fixed: setting properties does not effect
+ guowei <guowei@upyoo.com>
+ 2014-08-13 17:45:24 -0700
+ Commit: a8d2649, github.com/apache/spark/pull/1904
+
+ [SPARK-2970] [SQL] spark-sql script ends with IOException when EventLogging is enabled
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-13 17:42:38 -0700
+ Commit: b5b632c, github.com/apache/spark/pull/1891
+
+ [SPARK-2935][SQL]Fix parquet predicate push down bug
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-13 17:40:59 -0700
+ Commit: e8e7f17, github.com/apache/spark/pull/1863
+
+ [SPARK-2650][SQL] More precise initial buffer size estimation for in-memory column buffer
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-13 17:37:55 -0700
+ Commit: ee7d2cc, github.com/apache/spark/pull/1901
+
+ [SPARK-2994][SQL] Support for udfs that take complex types
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-13 17:35:38 -0700
+ Commit: 71b8408, github.com/apache/spark/pull/1915
+
+ [SPARK-2817] [SQL] add "show create table" support
+ tianyi <tianyi@asiainfo-linkage.com>, tianyi <tianyi@asiainfo.com>, tianyi <tianyi.asiainfo@gmail.com>
+ 2014-08-13 16:50:02 -0700
+ Commit: 0fb1198, github.com/apache/spark/pull/1760
+
+ [SPARK-3004][SQL] Added null checking when retrieving row set
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-13 16:27:50 -0700
+ Commit: 8732375, github.com/apache/spark/pull/1920
+
+ [MLLIB] use Iterator.fill instead of Array.fill
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-13 16:20:49 -0700
+ Commit: e63bf87, github.com/apache/spark/pull/1930
+
+ [SPARK-2983] [PySpark] improve performance of sortByKey()
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-13 14:57:12 -0700
+ Commit: a7bc21c, github.com/apache/spark/pull/1898
+
+ [SPARK-3013] [SQL] [PySpark] convert array into list
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-13 14:56:11 -0700
+ Commit: 9936020, github.com/apache/spark/pull/1928
+
+ [SPARK-2963] [SQL] There is no documentation about building to use HiveServer and CLI for SparkSQL
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-13 14:42:57 -0700
+ Commit: 78f2f99, github.com/apache/spark/pull/1885
+
+ [SPARK-2993] [MLLib] colStats (wrapper around MultivariateStatisticalSummary) in Statistics
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-08-12 23:47:42 -0700
+ Commit: 5ebeb3f, github.com/apache/spark/pull/1911
+
+ [SPARK-1777 (partial)] bugfix: make size of requested memory correctly
+ Zhang, Liye <liye.zhang@intel.com>
+ 2014-08-12 23:43:36 -0700
+ Commit: ec5e2b0, github.com/apache/spark/pull/1892
+
+ Use transferTo when copy merge files in ExternalSorter
+ Raymond Liu <raymond.liu@intel.com>
+ 2014-08-12 23:19:35 -0700
+ Commit: be674b3, github.com/apache/spark/pull/1884
+
+ [SPARK-2953] Allow using short names for io compression codecs
+ Reynold Xin <rxin@apache.org>
+ 2014-08-12 22:50:29 -0700
+ Commit: 837bf60, github.com/apache/spark/pull/1873
+
+ SPARK-2830 [MLlib]: re-organize mllib documentation
+ Ameet Talwalkar <atalwalkar@gmail.com>
+ 2014-08-12 17:15:21 -0700
+ Commit: cffd9bb, github.com/apache/spark/pull/1908
+
+ fix flaky tests
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-12 16:26:01 -0700
+ Commit: b5f8083, github.com/apache/spark/pull/1910
+
+ [MLlib] Correctly set vectorSize and alpha
+ Liquan Pei <liquanpei@gmail.com>
+ 2014-08-12 00:28:00 -0700
+ Commit: 2a8117a, github.com/apache/spark/pull/1900
+
+ [SPARK-2923][MLLIB] Implement some basic BLAS routines
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-11 22:33:45 -0700
+ Commit: 872c170, github.com/apache/spark/pull/1849
+
+ [SQL] [SPARK-2826] Reduce the memory copy while building the hashmap for HashOuterJoin
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-08-11 20:45:14 -0700
+ Commit: f66f260, github.com/apache/spark/pull/1765
+
+ [SPARK-2650][SQL] Build column buffers in smaller batches
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-11 20:21:56 -0700
+ Commit: 779d1eb, github.com/apache/spark/pull/1880
+
+ [SPARK-2968][SQL] Fix nullabilities of Explode.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-08-11 20:18:03 -0700
+ Commit: 54b387f, github.com/apache/spark/pull/1888
+
+ [SPARK-2965][SQL] Fix HashOuterJoin output nullabilities.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-08-11 20:15:01 -0700
+ Commit: dcbf079, github.com/apache/spark/pull/1887
+
+ [SQL] A tiny refactoring in HiveContext#analyze
+ Yin Huai <huaiyin.thu@gmail.com>
+ 2014-08-11 20:11:29 -0700
+ Commit: fd8173f, github.com/apache/spark/pull/1881
+
+ [sql]use SparkSQLEnv.stop() in ShutdownHook
+ wangfei <wangfei1@huawei.com>
+ 2014-08-11 20:10:13 -0700
+ Commit: 6d0af52, github.com/apache/spark/pull/1852
+
+ [SPARK-2590][SQL] Added option to handle incremental collection, disabled by default
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-11 20:08:06 -0700
+ Commit: cf2f807, github.com/apache/spark/pull/1853
+
+ [SPARK-2844][SQL] Correctly set JVM HiveContext if it is passed into Python HiveContext constructor
+ Ahir Reddy <ahirreddy@gmail.com>
+ 2014-08-11 20:06:06 -0700
+ Commit: 8cb4e5b, github.com/apache/spark/pull/1768
+
+ [SPARK-2934][MLlib] Adding LogisticRegressionWithLBFGS Interface
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-08-11 19:49:29 -0700
+ Commit: 8f6e2e9, github.com/apache/spark/pull/1862
+
+ [SPARK-2515][mllib] Chi Squared test
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-08-11 19:22:14 -0700
+ Commit: 7e31f7c, github.com/apache/spark/pull/1733
+
+ [SPARK-2931] In TaskSetManager, reset currentLocalityIndex after recomputing locality levels
+ Josh Rosen <joshrosen@apache.org>
+ 2014-08-11 19:15:01 -0700
+ Commit: 6c64d57, github.com/apache/spark/pull/1896
+
+ [SPARK-2952] Enable logging actor messages at DEBUG level
+ Reynold Xin <rxin@apache.org>
+ 2014-08-11 15:25:21 -0700
+ Commit: 6ec1374, github.com/apache/spark/pull/1870
+
+ [PySpark] [SPARK-2954] [SPARK-2948] [SPARK-2910] [SPARK-2101] Python 2.6 Fixes
+ Josh Rosen <joshrosen@apache.org>
+ 2014-08-11 11:54:09 -0700
+ Commit: 09b8a3c, github.com/apache/spark/pull/1868
+
+ [SPARK-2937] Separate out sampleByKeyExact as its own API in PairRDDFunction
+ Doris Xin <doris.s.xin@gmail.com>, Xiangrui Meng <meng@databricks.com>
+ 2014-08-10 16:31:07 -0700
+ Commit: 3def842, github.com/apache/spark/pull/1866
+
+ [SPARK-2898] [PySpark] fix bugs in daemon.py
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-10 13:00:38 -0700
+ Commit: 92daffe, github.com/apache/spark/pull/1842
+
+ Remove extra semicolon in Task.scala
+ GuoQiang Li <witgo@qq.com>
+ 2014-08-10 12:12:22 -0700
+ Commit: bb23b11, github.com/apache/spark/pull/1876
+
+ Turn UpdateBlockInfo into case class.
+ Reynold Xin <rxin@apache.org>
+ 2014-08-09 23:06:54 -0700
+ Commit: 076ddda, github.com/apache/spark/pull/1872
+
+ Updated Spark SQL README to include the hive-thriftserver module
+ Reynold Xin <rxin@apache.org>
+ 2014-08-09 22:05:36 -0700
+ Commit: e8f8e5f, github.com/apache/spark/pull/1867
+
+ [SPARK-2894] spark-shell doesn't accept flags
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>, Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-09 21:10:43 -0700
+ Commit: ba223b8, github.com/apache/spark/pull/1715
+
+ [SPARK-1766] sorted functions to meet pedantic requirements
+ Chris Cope <ccope@resilientscience.com>
+ 2014-08-09 20:58:56 -0700
+ Commit: 4a7f3ef, github.com/apache/spark/pull/1859
+
+ [SPARK-2861] Fix Doc comment of histogram method
+ Chandan Kumar <chandan.kumar@imaginea.com>
+ 2014-08-09 00:45:54 -0700
+ Commit: 71fcd2e, github.com/apache/spark/pull/1786
+
+ [SPARK-2635] Fix race condition at SchedulerBackend.isReady in standalone mode
+ li-zhihui <zhihui.li@intel.com>, Li Zhihui <zhihui.li@intel.com>
+ 2014-08-08 22:52:56 -0700
+ Commit: 3311da2, github.com/apache/spark/pull/1525
+
+ [SPARK-2897][SPARK-2920]TorrentBroadcast does use the serializer class specified in the spark option "spark.serializer"
+ GuoQiang Li <witgo@qq.com>
+ 2014-08-08 16:57:26 -0700
+ Commit: dd11e4e, github.com/apache/spark/pull/1836
+
+ [SPARK-1997][MLLIB] update breeze to 0.9
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-08 15:07:31 -0700
+ Commit: 8fba6de, github.com/apache/spark/pull/1749
+
+ [SPARK-2700] [SQL] Hidden files (such as .impala_insert_staging) should be filtered out by sqlContext.parquetFile
+ chutium <teng.qiu@gmail.com>
+ 2014-08-08 13:31:08 -0700
+ Commit: e264503, github.com/apache/spark/pull/1691
+
+ [SPARK-2919] [SQL] Basic support for analyze command in HiveQl
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-08 11:23:58 -0700
+ Commit: daa090f, github.com/apache/spark/pull/1848
+
+ [SPARK-2877] [SQL] MetastoreRelation should use SparkClassLoader when creating the tableDesc
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-08 11:15:16 -0700
+ Commit: 8b0188b, github.com/apache/spark/pull/1806
+
+ [SPARK-2908] [SQL] JsonRDD.nullTypeToStringType does not convert all NullType to StringType
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-08 11:10:11 -0700
+ Commit: 544a909, github.com/apache/spark/pull/1840
+
+ [SPARK-2888] [SQL] Fix addColumnMetadataToConf in HiveTableScan
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-08 11:01:51 -0700
+ Commit: 3eb5dd0, github.com/apache/spark/pull/1817
+
+ [SPARK-2904] Remove non-used local variable in SparkSubmitArguments
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-07 18:53:15 -0700
+ Commit: a54b5d9, github.com/apache/spark/pull/1834
+
+ SPARK-2565. Update ShuffleReadMetrics as blocks are fetched
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-08-07 18:09:03 -0700
+ Commit: aab7735, github.com/apache/spark/pull/1507
+
+ SPARK-2787: Make sort-based shuffle write files directly when there's no sorting/aggregation and # partitions is small
+ Matei Zaharia <matei@databricks.com>
+ 2014-08-07 18:04:49 -0700
+ Commit: 0f2274f, github.com/apache/spark/pull/1799
+
+ SPARK-2899 Doc generation is back to working in new SBT Build.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-08-07 16:24:22 -0700
+ Commit: 30369b8, github.com/apache/spark/pull/1830
+
+ SPARK-2905 Fixed path sbin => bin
+ Oleg Danilov <oleg.danilov@wandisco.com>
+ 2014-08-07 15:48:44 -0700
+ Commit: c65c810, github.com/apache/spark/pull/1835
+
+ [SPARK-2852][MLLIB] Separate model from IDF/StandardScaler algorithms
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-07 11:28:12 -0700
+ Commit: f705c1d, github.com/apache/spark/pull/1814
+
+ [mllib] DecisionTree Strategy parameter checks
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-07 00:20:38 -0700
+ Commit: c089429, github.com/apache/spark/pull/1821
+
+ SPARK-2879 part 2 [BUILD] Use HTTPS to access Maven Central and other repos
+ Sean Owen <srowen@gmail.com>
+ 2014-08-07 00:04:18 -0700
+ Commit: d6cd6fd0, github.com/apache/spark/pull/1828
+
+ [SPARK-2851] [mllib] DecisionTree Python consistency update
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-06 22:58:59 -0700
+ Commit: c9f0944, github.com/apache/spark/pull/1798
+
+ [SPARK-2887] fix bug of countApproxDistinct() when have more than one partition
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-06 21:22:13 -0700
+ Commit: cc8a7e9, github.com/apache/spark/pull/1812
+
+ Updating versions for Spark 1.1.0
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-06 19:11:39 -0700
+ Commit: cf35b56
+
+ HOTFIX: Support custom Java 7 location
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-06 18:45:03 -0700
+ Commit: 53fa048
+
+ SPARK-2879 [BUILD] Use HTTPS to access Maven Central and other repos
+ Sean Owen <srowen@gmail.com>
+ 2014-08-06 18:13:35 -0700
+ Commit: 40284a9, github.com/apache/spark/pull/1805
+
+ [SPARK-2583] ConnectionManager error reporting
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>, Josh Rosen <joshrosen@apache.org>
+ 2014-08-06 17:27:55 -0700
+ Commit: 3f92ce4, github.com/apache/spark/pull/1758
+
+ SPARK-2882: Spark build now checks local maven cache for dependencies
+ Gregory Owen <greowen@gmail.com>
+ 2014-08-06 16:52:00 -0700
+ Commit: c2ae0b0, github.com/apache/spark/pull/1818
+
+ [PySpark] Add blanklines to Python docstrings so example code renders correctly
+ RJ Nowling <rnowling@gmail.com>
+ 2014-08-06 14:12:21 -0700
+ Commit: a314e29, github.com/apache/spark/pull/1808
+
+ [SPARK-2852][MLLIB] API consistency for `mllib.feature`
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-06 14:07:51 -0700
+ Commit: e654cfd, github.com/apache/spark/pull/1807
+
+ SPARK-2566. Update ShuffleWriteMetrics incrementally
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-08-06 13:10:33 -0700
+ Commit: a65c9ac, github.com/apache/spark/pull/1481
+
+ [SPARK-2627] [PySpark] have the build enforce PEP 8 automatically
+ Nicholas Chammas <nicholas.chammas@gmail.com>, nchammas <nicholas.chammas@gmail.com>
+ 2014-08-06 12:58:24 -0700
+ Commit: 4c19614, github.com/apache/spark/pull/1744
+
+ [SPARK-2678][Core][SQL] A workaround for SPARK-2678
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-06 12:28:35 -0700
+ Commit: cf8e7fd, github.com/apache/spark/pull/1801
+
+ [SPARK-2875] [PySpark] [SQL] handle null in schemaRDD()
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-06 11:08:12 -0700
+ Commit: 27a8d4c, github.com/apache/spark/pull/1802
+
+ [SPARK-2157] Enable tight firewall rules for Spark
+ Andrew Or <andrewor14@gmail.com>, Andrew Ash <andrew@andrewash.com>
+ 2014-08-06 00:07:40 -0700
+ Commit: 31090e4, github.com/apache/spark/pull/1777
+
+ [SPARK-1022][Streaming][HOTFIX] Fixed zookeeper dependency of Kafka
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-08-05 23:41:34 -0700
+ Commit: 5b4bc84, github.com/apache/spark/pull/1797
+
+ [MLlib] Use this.type as return type in k-means' builder pattern
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-08-05 23:32:29 -0700
+ Commit: aec217a, github.com/apache/spark/pull/1796
+
+ SPARK-2294: fix locality inversion bug in TaskManager
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-08-05 23:02:58 -0700
+ Commit: 1da2fdf, github.com/apache/spark/pull/1313
+
+ [SQL] Fix logging warn -> debug
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-05 22:30:32 -0700
+ Commit: 0482055, github.com/apache/spark/pull/1800
+
+ [SQL] Tighten the visibility of various SQLConf methods and renamed setter/getters
+ Reynold Xin <rxin@apache.org>
+ 2014-08-05 22:29:19 -0700
+ Commit: 4f0b4f4, github.com/apache/spark/pull/1794
+
+ [SPARK-2806] core - upgrade to json4s-jackson 3.2.10
+ Anand Avati <avati@redhat.com>
+ 2014-08-05 21:59:10 -0700
+ Commit: 6da8f41, github.com/apache/spark/pull/1702
+
+ [SPARK-2866][SQL] Support attributes in ORDER BY that aren't in SELECT
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-05 20:55:02 -0700
+ Commit: 936f61e, github.com/apache/spark/pull/1795
+
+ [SPARK-2854][SQL] Finalize _acceptable_types in pyspark.sql
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-05 18:56:10 -0700
+ Commit: a10e1b0, github.com/apache/spark/pull/1793
+
+ [SPARK-2650][SQL] Try to partially fix SPARK-2650 by adjusting initial buffer size and reducing memory allocation
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-05 18:50:37 -0700
+ Commit: 4233b02, github.com/apache/spark/pull/1769
+
+ [sql] rename project name in pom.xml of hive-thriftserver module
+ wangfei <wangfei1@huawei.com>
+ 2014-08-05 18:30:02 -0700
+ Commit: 152e36c, github.com/apache/spark/pull/1789
+
+ SPARK-2869 - Fix tiny bug in JdbcRdd for closing jdbc connection
+ Stephen Boesch <javadba>, Stephen Boesch <javadba@gmail.com>
+ 2014-08-05 18:18:08 -0700
+ Commit: 58247a8, github.com/apache/spark/pull/1792
+
+ [SPARK-2550][MLLIB][APACHE SPARK] Support regularization and intercept in pyspark's linear methods
+ Michael Giannakopoulos <miccagiann@gmail.com>
+ 2014-08-05 16:30:32 -0700
+ Commit: 672904e, github.com/apache/spark/pull/1775
+
+ [SPARK-2503] Lower shuffle output buffer (spark.shuffle.file.buffer.kb) to 32KB.
+ Reynold Xin <rxin@apache.org>
+ 2014-08-05 16:24:50 -0700
+ Commit: 0172277, github.com/apache/spark/pull/1781
+
+ [SPARK-2856] Decrease initial buffer size for Kryo to 64KB.
+ Reynold Xin <rxin@apache.org>
+ 2014-08-05 01:30:46 -0700
+ Commit: 5081b0d, github.com/apache/spark/pull/1780
+
+ [SPARK-2864][MLLIB] fix random seed in word2vec; move model to local
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-05 16:22:41 -0700
+ Commit: e77fa81, github.com/apache/spark/pull/1790
+
+ SPARK-1680: use configs for specifying environment variables on YARN
+ Thomas Graves <tgraves@apache.org>
+ 2014-08-05 15:57:32 -0500
+ Commit: 7b798e1, github.com/apache/spark/pull/1512
+
+ SPARK-2380: Support displaying accumulator values in the web UI
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-05 13:08:23 -0700
+ Commit: 46b6983, github.com/apache/spark/pull/1309
+
+ [SPARK-2859] Update url of Kryo project in related docs
+ Guancheng (G.C.) Chen <chenguancheng@gmail.com>
+ 2014-08-05 11:50:08 -0700
+ Commit: 0f541ab, github.com/apache/spark/pull/1782
+
+ [SPARK-2860][SQL] Fix coercion of CASE WHEN.
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-05 11:17:50 -0700
+ Commit: 388ab53, github.com/apache/spark/pull/1785
+
+ SPARK-1890 and SPARK-1891- add admin and modify acls
+ Thomas Graves <tgraves@apache.org>
+ 2014-08-05 12:52:52 -0500
+ Commit: e3fe657, github.com/apache/spark/pull/1196
+
+ SPARK-1528 - spark on yarn, add support for accessing remote HDFS
+ Thomas Graves <tgraves@apache.org>
+ 2014-08-05 12:48:26 -0500
+ Commit: 6c0c65f, github.com/apache/spark/pull/1159
+
+ [SPARK-1022][Streaming] Add Kafka real unit test
+ jerryshao <saisai.shao@intel.com>
+ 2014-08-05 10:40:28 -0700
+ Commit: b92a450, github.com/apache/spark/pull/1751
+
+ [SPARK-1779] Throw an exception if memory fractions are not between 0 and 1
+ wangfei <scnbwf@yeah.net>, wangfei <wangfei1@huawei.com>
+ 2014-08-05 00:51:07 -0700
+ Commit: 075ba67, github.com/apache/spark/pull/714
+
+ [SPARK-2857] Correct properties to set Master / Worker ports
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-05 00:39:07 -0700
+ Commit: 12f99cf, github.com/apache/spark/pull/1779
+
+ SPARK-2711. Create a ShuffleMemoryManager to track memory for all spilling collections
+ Matei Zaharia <matei@databricks.com>
+ 2014-08-04 23:41:03 -0700
+ Commit: d13d253, github.com/apache/spark/pull/1707
+
+ SPARK-2685. Update ExternalAppendOnlyMap to avoid buffer.remove()
+ Matei Zaharia <matei@databricks.com>
+ 2014-08-04 23:27:53 -0700
+ Commit: a092285, github.com/apache/spark/pull/1773
+
+ [SPARK-2323] Exception in accumulator update should not crash DAGScheduler & SparkContext
+ Reynold Xin <rxin@apache.org>
+ 2014-08-04 20:39:18 -0700
+ Commit: 4ed7b5a, github.com/apache/spark/pull/1772
+
+ [SPARK-1687] [PySpark] fix unit tests related to pickable namedtuple
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-04 15:54:52 -0700
+ Commit: 2225d18, github.com/apache/spark/pull/1771
+
+ SPARK-2792. Fix reading too much or too little data from each stream in ExternalMap / Sorter
+ Matei Zaharia <matei@databricks.com>
+ 2014-08-04 12:59:18 -0700
+ Commit: aa7a48e, github.com/apache/spark/pull/1722
+
+ [SPARK-1687] [PySpark] pickable namedtuple
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-04 12:13:41 -0700
+ Commit: bfd2f39, github.com/apache/spark/pull/1623
+
+ [MLlib] [SPARK-2510]Word2Vec: Distributed Representation of Words
+ Liquan Pei <lpei@gopivotal.com>, Xiangrui Meng <meng@databricks.com>, Liquan Pei <liquanpei@gmail.com>
+ 2014-08-03 23:55:58 -0700
+ Commit: 3823f6d, github.com/apache/spark/pull/1719
+
+ SPARK-2272 [MLlib] Feature scaling which standardizes the range of independent variables or features of data
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-08-03 21:39:21 -0700
+ Commit: 9aa1459, github.com/apache/spark/pull/1207
+
+ Fix some bugs with spaces in directory name.
+ Sarah Gerweck <sarah.a180@gmail.com>
+ 2014-08-03 19:47:05 -0700
+ Commit: 2152e24, github.com/apache/spark/pull/1756
+
+ [SPARK-2810] upgrade to scala-maven-plugin 3.2.0
+ Anand Avati <avati@redhat.com>
+ 2014-08-03 17:47:49 -0700
+ Commit: 4784d24, github.com/apache/spark/pull/1711
+
+ [SPARK-1740] [PySpark] kill the python worker
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-03 15:52:00 -0700
+ Commit: a4cdb77, github.com/apache/spark/pull/1643
+
+ [SPARK-2783][SQL] Basic support for analyze in HiveContext
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-03 14:54:41 -0700
+ Commit: 7c6afda, github.com/apache/spark/pull/1741
+
+ [SPARK-2814][SQL] HiveThriftServer2 throws NPE when executing native commands
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-03 12:34:46 -0700
+ Commit: 6ffdcc6, github.com/apache/spark/pull/1753
+
+ [SPARK-2784][SQL] Deprecate hql() method in favor of a config option, 'spark.sql.dialect'
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-03 12:28:29 -0700
+ Commit: c5ed1de, github.com/apache/spark/pull/1746
+
+ [SPARK-2197] [mllib] Java DecisionTree bug fix and ease-of-use
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-03 10:36:52 -0700
+ Commit: eaa9355, github.com/apache/spark/pull/1740
+
+ SPARK-2246: Add user-data option to EC2 scripts
+ Allan Douglas R. de Oliveira <allan@chaordicsystems.com>
+ 2014-08-03 10:25:59 -0700
+ Commit: 162fc95, github.com/apache/spark/pull/1186
+
+ SPARK-2712 - Add a small note to maven doc that mvn package must happen ...
+ Stephen Boesch <javadba@gmail.com>
+ 2014-08-03 10:19:04 -0700
+ Commit: 1992175, github.com/apache/spark/pull/1615
+
+ [Minor] Fixes on top of #1679
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-02 22:00:46 -0700
+ Commit: fb2a207, github.com/apache/spark/pull/1736
+
+ SPARK-2414 [BUILD] Add LICENSE entry for jquery
+ Sean Owen <srowen@gmail.com>
+ 2014-08-02 21:55:56 -0700
+ Commit: c137928, github.com/apache/spark/pull/1748
+
+ SPARK-2602 [BUILD] Tests steal focus under Java 6
+ Sean Owen <srowen@gmail.com>
+ 2014-08-02 21:44:19 -0700
+ Commit: 0d47bb6, github.com/apache/spark/pull/1747
+
+ [SPARK-2739][SQL] Rename registerAsTable to registerTempTable
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-02 18:27:04 -0700
+ Commit: 5b30e00, github.com/apache/spark/pull/1743
+
+ [SPARK-2797] [SQL] SchemaRDDs don't support unpersist()
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-02 17:55:22 -0700
+ Commit: 5ef8282, github.com/apache/spark/pull/1745
+
+ [SPARK-2729][SQL] Added test case for SPARK-2729
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-08-02 17:12:49 -0700
+ Commit: 460fad8, github.com/apache/spark/pull/1738
+
+ [SPARK-2785][SQL] Remove assertions that throw when users try unsupported Hive commands.
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-02 16:48:07 -0700
+ Commit: 4230df4, github.com/apache/spark/pull/1742
+
+ [SPARK-2097][SQL] UDF Support
+ Michael Armbrust <michael@databricks.com>
+ 2014-08-02 16:33:48 -0700
+ Commit: 3b9f25f, github.com/apache/spark/pull/1063
+
+ SPARK-2804: Remove scalalogging-slf4j dependency
+ GuoQiang Li <witgo@qq.com>
+ 2014-08-02 13:55:28 -0700
+ Commit: 7924d72, github.com/apache/spark/pull/also
+
+ [SPARK-1981] Add AWS Kinesis streaming support
+ Chris Fregly <chris@fregly.com>
+ 2014-08-02 13:35:35 -0700
+ Commit: bb0ac6d, github.com/apache/spark/pull/1434
+
+ [SQL] Set outputPartitioning of BroadcastHashJoin correctly.
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-02 13:16:41 -0700
+ Commit: 91de0dc, github.com/apache/spark/pull/1735
+
+ [SPARK-2478] [mllib] DecisionTree Python API
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-02 13:07:17 -0700
+ Commit: 8d6ac2b, github.com/apache/spark/pull/1727
+
+ [HOTFIX] Do not throw NPE if spark.test.home is not set
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-02 12:11:50 -0700
+ Commit: e221108, github.com/apache/spark/pull/1739
+
+ MAINTENANCE: Automated closing of pull requests.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-02 01:26:16 -0700
+ Commit: 87738bf, github.com/apache/spark/pull/706
+
+ HOTFIX: Fix concurrency issue in FlumePollingStreamSuite.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-02 01:11:03 -0700
+ Commit: 44460ba
+
+ HOTFIX: Fixing test error in maven for flume-sink.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-02 00:57:47 -0700
+ Commit: 25cad6a
+
+ [SPARK-1812] sql/catalyst - Provide explicit type information
+ Anand Avati <avati@redhat.com>
+ 2014-08-02 00:48:17 -0700
+ Commit: 08c095b, github.com/apache/spark/pull/1709
+
+ [SPARK-2454] Do not ship spark home to Workers
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-02 00:45:38 -0700
+ Commit: 148af60, github.com/apache/spark/pull/1734
+
+ [SPARK-2316] Avoid O(blocks) operations in listeners
+ Andrew Or <andrewor14@gmail.com>
+ 2014-08-01 23:56:24 -0700
+ Commit: d934801, github.com/apache/spark/pull/1679
+
+ Revert "[SPARK-1470][SPARK-1842] Use the scala-logging wrapper instead of the directly sfl4j api"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-08-01 23:55:30 -0700
+ Commit: dab3796
+
+ [SPARK-1470][SPARK-1842] Use the scala-logging wrapper instead of the directly sfl4j api
+ GuoQiang Li <witgo@qq.com>
+ 2014-08-01 23:55:11 -0700
+ Commit: adc8303, github.com/apache/spark/pull/1369
+
+ StatCounter on NumPy arrays [PYSPARK][SPARK-2012]
+ Jeremy Freeman <the.freeman.lab@gmail.com>
+ 2014-08-01 22:33:25 -0700
+ Commit: 4bc3bb2, github.com/apache/spark/pull/1725
+
+ [SPARK-2801][MLlib]: DistributionGenerator renamed to RandomDataGenerator. RandomRDD is now of generic type
+ Burak <brkyvz@gmail.com>
+ 2014-08-01 22:32:12 -0700
+ Commit: fda4759, github.com/apache/spark/pull/1732
+
+ [SPARK-1580][MLLIB] Estimate ALS communication and computation costs.
+ Tor Myklebust <tmyklebu@gmail.com>, Xiangrui Meng <meng@databricks.com>
+ 2014-08-01 21:25:02 -0700
+ Commit: e25ec06, github.com/apache/spark/pull/493
+
+ [SPARK-2550][MLLIB][APACHE SPARK] Support regularization and intercept in pyspark's linear methods.
+ Michael Giannakopoulos <miccagiann@gmail.com>
+ 2014-08-01 21:00:31 -0700
+ Commit: c281189, github.com/apache/spark/pull/1624
+
+ Streaming mllib [SPARK-2438][MLLIB]
+ Jeremy Freeman <the.freeman.lab@gmail.com>, freeman <the.freeman.lab@gmail.com>
+ 2014-08-01 20:10:26 -0700
+ Commit: f6a1899, github.com/apache/spark/pull/1361
+
+ [SPARK-2764] Simplify daemon.py process structure
+ Josh Rosen <joshrosen@apache.org>
+ 2014-08-01 19:38:21 -0700
+ Commit: e8e0fd6, github.com/apache/spark/pull/1680
+
+ [SPARK-2800]: Exclude scalastyle-output.xml Apache RAT checks
+ GuoQiang Li <witgo@qq.com>
+ 2014-08-01 19:35:16 -0700
+ Commit: a38d3c9, github.com/apache/spark/pull/1729
+
+ [SPARK-2116] Load spark-defaults.conf from SPARK_CONF_DIR if set
+ Albert Chu <chu11@llnl.gov>
+ 2014-08-01 19:00:38 -0700
+ Commit: 0da07da, github.com/apache/spark/pull/1059
+
+ [SPARK-2212][SQL] Hash Outer Join (follow-up bug fix).
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-01 18:52:01 -0700
+ Commit: 3822f33, github.com/apache/spark/pull/1721
+
+ [SPARK-2010] [PySpark] [SQL] support nested structure in SchemaRDD
+ Davies Liu <davies.liu@gmail.com>
+ 2014-08-01 18:47:41 -0700
+ Commit: 880eabe, github.com/apache/spark/pull/1598
+
+ [SPARK-2796] [mllib] DecisionTree bug fix: ordered categorical features
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-08-01 15:52:21 -0700
+ Commit: 7058a53, github.com/apache/spark/pull/1720
+
+ [SPARK-2786][mllib] Python correlations
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-08-01 15:02:17 -0700
+ Commit: d88e695, github.com/apache/spark/pull/1713
+
+ SPARK-2791: Fix committing, reverting and state tracking in shuffle file consolidation
+ Aaron Davidson <aaron@databricks.com>
+ 2014-08-01 13:57:19 -0700
+ Commit: 78f2af5, github.com/apache/spark/pull/1678
+
+ [SPARK-2379] Fix the bug that streaming's receiver may fall into a dead loop
+ joyyoj <sunshch@gmail.com>
+ 2014-08-01 13:41:55 -0700
+ Commit: b270309, github.com/apache/spark/pull/1694
+
+ SPARK-1612: Fix potential resource leaks
+ zsxwing <zsxwing@gmail.com>
+ 2014-08-01 13:25:04 -0700
+ Commit: f5d9bea, github.com/apache/spark/pull/535
+
+ [SPARK-2490] Change recursive visiting on RDD dependencies to iterative approach
+ Liang-Chi Hsieh <viirya@gmail.com>
+ 2014-08-01 12:12:30 -0700
+ Commit: baf9ce1, github.com/apache/spark/pull/1418
+
+ [SPARK-695] In DAGScheduler's getPreferredLocs, track set of visited partitions.
+ Aaron Staple <aaron.staple@gmail.com>
+ 2014-08-01 12:04:04 -0700
+ Commit: eb5bdca, github.com/apache/spark/pull/1362
+
+ [SQL] Documentation: Explain cacheTable command
+ CrazyJvm <crazyjvm@gmail.com>
+ 2014-08-01 11:46:13 -0700
+ Commit: c82fe47, github.com/apache/spark/pull/1681
+
+ [SPARK-2767] [SQL] SparkSQL CLI doesn't output error message if query failed.
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-08-01 11:42:05 -0700
+ Commit: c0b47ba, github.com/apache/spark/pull/1686
+
+ [SPARK-2729] [SQL] Forgot to match Timestamp type in ColumnBuilder
+ chutium <teng.qiu@gmail.com>
+ 2014-08-01 11:31:44 -0700
+ Commit: 580c701, github.com/apache/spark/pull/1636
+
+ [SQL][SPARK-2212]Hash Outer Join
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-08-01 11:27:12 -0700
+ Commit: 4415722, github.com/apache/spark/pull/1147
+
+ [SPARK-2179][SQL] A minor refactoring Java data type APIs (2179 follow-up).
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-08-01 11:14:53 -0700
+ Commit: c41fdf0, github.com/apache/spark/pull/1712
+
+ SPARK-2099. Report progress while task is running.
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-08-01 11:08:39 -0700
+ Commit: 8d338f6, github.com/apache/spark/pull/1056
+
+ [HOTFIX] downgrade breeze version to 0.7
+ Xiangrui Meng <meng@databricks.com>
+ 2014-08-01 10:00:46 -0700
+ Commit: 5328c0a, github.com/apache/spark/pull/1718
+
+ [SPARK-1997] update breeze to version 0.8.1
+ witgo <witgo@qq.com>
+ 2014-08-01 07:47:44 -0700
+ Commit: 0dacb1a, github.com/apache/spark/pull/940
+
+ SPARK-2768 [MLLIB] Add product, user recommend method to MatrixFactorizationModel
+ Sean Owen <srowen@gmail.com>
+ 2014-08-01 07:32:53 -0700
+ Commit: 82d209d, github.com/apache/spark/pull/1687
+
+ [SPARK-2103][Streaming] Change to ClassTag for KafkaInputDStream and fix reflection issue
+ jerryshao <saisai.shao@intel.com>
+ 2014-08-01 04:32:46 -0700
+ Commit: a32f0fb, github.com/apache/spark/pull/1508
+
+ [Spark 2557] fix LOCAL_N_REGEX in createTaskScheduler and make local-n and local-n-failures consistent
+ Ye Xianjin <advancedxy@gmail.com>
+ 2014-08-01 00:34:39 -0700
+ Commit: 284771e, github.com/apache/spark/pull/1464
+
+ SPARK-2134: Report metrics before application finishes
+ Rahul Singhal <rahul.singhal@guavus.com>
+ 2014-08-01 00:33:15 -0700
+ Commit: f1957e1, github.com/apache/spark/pull/1076
+
+ SPARK-983. Support external sorting in sortByKey()
+ Matei Zaharia <matei@databricks.com>
+ 2014-08-01 00:16:18 -0700
+ Commit: 72e3369, github.com/apache/spark/pull/931
+
+ [SPARK-2670] FetchFailedException should be thrown when local fetch has failed
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-08-01 00:01:30 -0700
+ Commit: 8ff4417, github.com/apache/spark/pull/1578
+
+ SPARK-2738. Remove redundant imports in BlockManagerSuite
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-07-31 23:12:38 -0700
+ Commit: cb9e7d5, github.com/apache/spark/pull/1642
+
+ SPARK-2632, SPARK-2576. Fixed by only importing what is necessary during class definition.
+ Prashant Sharma <scrapcodes@gmail.com>, Yin Huai <huai@cse.ohio-state.edu>, Prashant Sharma <prashant.s@imaginea.com>
+ 2014-07-31 22:57:13 -0700
+ Commit: 1499101, github.com/apache/spark/pull/1635
+
+ [SPARK-2702][Core] Upgrade Tachyon dependency to 0.5.0
+ Haoyuan Li <haoyuan@cs.berkeley.edu>
+ 2014-07-31 22:53:42 -0700
+ Commit: 2cdc3e5, github.com/apache/spark/pull/1651
+
+ [SPARK-2782][mllib] Bug fix for getRanks in SpearmanCorrelation
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-07-31 21:23:35 -0700
+ Commit: c475540, github.com/apache/spark/pull/1710
+
+ [SPARK-2777][MLLIB] change ALS factors storage level to MEMORY_AND_DISK
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-31 21:14:08 -0700
+ Commit: b190083, github.com/apache/spark/pull/1700
+
+ SPARK-2766: ScalaReflectionSuite throw an IllegalArgumentException in JDK 6
+ GuoQiang Li <witgo@qq.com>
+ 2014-07-31 21:06:57 -0700
+ Commit: 9998efa, github.com/apache/spark/pull/1683
+
+ [SPARK-2779] [SQL] asInstanceOf[Map[...]] should use scala.collection.Map instead of scala.collection.immutable.Map
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-31 21:02:11 -0700
+ Commit: 9632719, github.com/apache/spark/pull/1705
+
+ [SPARK-2756] [mllib] Decision tree bug fixes
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-07-31 20:51:48 -0700
+ Commit: b124de5, github.com/apache/spark/pull/1673
+
+ [SPARK-2724] Python version of RandomRDDGenerators
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-07-31 20:32:57 -0700
+ Commit: d843014, github.com/apache/spark/pull/1628
+
+ [SPARK-2531 & SPARK-2436] [SQL] Optimize the BuildSide when planning BroadcastNestedLoopJoin.
+ Zongheng Yang <zongheng.y@gmail.com>
+ 2014-07-31 19:32:16 -0700
+ Commit: 8f51491, github.com/apache/spark/pull/1448
+
+ SPARK-2282: Reuse Socket for sending accumulator updates to Pyspark
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-31 15:31:53 -0700
+ Commit: ef4ff00, github.com/apache/spark/pull/1503
+
+ SPARK-2740: allow user to specify ascending and numPartitions for sortBy...
+ Rui Li <rui.li@intel.com>
+ 2014-07-31 15:07:26 -0700
+ Commit: 492a195, github.com/apache/spark/pull/1645
+
+ Docs: monitoring, streaming programming guide
+ kballou <kballou@devnulllabs.io>
+ 2014-07-31 14:58:52 -0700
+ Commit: cc82050, github.com/apache/spark/pull/1662
+
+ Improvements to merge_spark_pr.py
+ Josh Rosen <joshrosen@apache.org>
+ 2014-07-31 14:35:09 -0700
+ Commit: e021362, github.com/apache/spark/pull/1668
+
+ [SPARK-2523] [SQL] Hadoop table scan bug fixing (fix failing Jenkins maven test)
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-31 13:05:24 -0700
+ Commit: 49b3612, github.com/apache/spark/pull/1669
+
+ [SPARK-2511][MLLIB] add HashingTF and IDF
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-31 12:55:00 -0700
+ Commit: dc0865b, github.com/apache/spark/pull/1671
+
+ SPARK-2646. log4j initialization not quite compatible with log4j 2.x
+ Sean Owen <srowen@gmail.com>
+ 2014-07-31 12:26:36 -0700
+ Commit: e5749a1, github.com/apache/spark/pull/1547
+
+ SPARK-2749 [BUILD] Part 2. Fix a follow-on scalastyle error
+ Sean Owen <srowen@gmail.com>
+ 2014-07-31 12:18:40 -0700
+ Commit: 4dbabb3, github.com/apache/spark/pull/1690
+
+ SPARK-2664. Deal with `--conf` options in spark-submit that relate to fl...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-07-31 11:51:20 -0700
+ Commit: f68105d, github.com/apache/spark/pull/1665
+
+ SPARK-2028: Expose mapPartitionsWithInputSplit in HadoopRDD
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-31 11:35:38 -0700
+ Commit: f193312, github.com/apache/spark/pull/973
+
+ [SPARK-2397][SQL] Deprecate LocalHiveContext
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-31 11:26:43 -0700
+ Commit: 72cfb13, github.com/apache/spark/pull/1641
+
+ [SPARK-2743][SQL] Resolve original attributes in ParquetTableScan
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-31 11:15:25 -0700
+ Commit: 3072b96, github.com/apache/spark/pull/1647
+
+ [SPARK-2762] SparkILoop leaks memory in multi-repl configurations
+ Timothy Hunter <timhunter@databricks.com>
+ 2014-07-31 10:25:40 -0700
+ Commit: 92ca910, github.com/apache/spark/pull/1674
+
+ automatically set master according to `spark.master` in `spark-defaults....
+ CrazyJvm <crazyjvm@gmail.com>
+ 2014-07-30 23:37:25 -0700
+ Commit: 669e3f0, github.com/apache/spark/pull/1644
+
+ [SPARK-2497] Included checks for module symbols too.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-07-30 22:46:30 -0700
+ Commit: 5a110da, github.com/apache/spark/pull/1463
+
+ [SPARK-2737] Add retag() method for changing RDDs' ClassTags.
+ Josh Rosen <joshrosen@apache.org>
+ 2014-07-30 22:40:57 -0700
+ Commit: 4fb2593, github.com/apache/spark/pull/1639
+
+ [SPARK-2340] Resolve event logging and History Server paths properly
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-30 21:57:32 -0700
+ Commit: a7c305b, github.com/apache/spark/pull/1280
+
+ Required AM memory is "amMem", not "args.amMemory"
+ derek ma <maji3@asiainfo-linkage.com>
+ 2014-07-30 21:37:59 -0700
+ Commit: 118c1c4, github.com/apache/spark/pull/1494
+
+ [SPARK-2758] UnionRDD's UnionPartition should not reference parent RDDs
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 21:30:13 -0700
+ Commit: 894d48f, github.com/apache/spark/pull/1675
+
+ SPARK-2045 Sort-based shuffle
+ Matei Zaharia <matei@databricks.com>
+ 2014-07-30 18:07:59 -0700
+ Commit: e966284, github.com/apache/spark/pull/1499
+
+ Update DecisionTreeRunner.scala
+ strat0sphere <stratos.dimopoulos@gmail.com>
+ 2014-07-30 17:57:50 -0700
+ Commit: da50176, github.com/apache/spark/pull/1676
+
+ SPARK-2341 [MLLIB] loadLibSVMFile doesn't handle regression datasets
+ Sean Owen <srowen@gmail.com>
+ 2014-07-30 17:34:32 -0700
+ Commit: e9b275b, github.com/apache/spark/pull/1663
+
+ [SPARK-2734][SQL] Remove tables from cache when DROP TABLE is run.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-30 17:30:51 -0700
+ Commit: 88a519d, github.com/apache/spark/pull/1650
+
+ SPARK-2741 - Publish version of spark assembly which does not contain Hive
+ Brock Noland <brock@apache.org>
+ 2014-07-30 17:04:30 -0700
+ Commit: 2ac37db, github.com/apache/spark/pull/1667
+
+ SPARK-2749 [BUILD]. Spark SQL Java tests aren't compiling in Jenkins' Maven builds; missing junit:junit dep
+ Sean Owen <srowen@gmail.com>
+ 2014-07-30 15:04:33 -0700
+ Commit: 6ab96a6, github.com/apache/spark/pull/1660
+
+ Properly pass SBT_MAVEN_PROFILES into sbt.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 14:31:20 -0700
+ Commit: 2f4b170
+
+ Set AMPLAB_JENKINS_BUILD_PROFILE.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 14:08:24 -0700
+ Commit: 1097327
+
+ Wrap JAR_DL in dev/check-license.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 13:42:43 -0700
+ Commit: 7c7ce54
+
+ [SPARK-2024] Add saveAsSequenceFile to PySpark
+ Kan Zhang <kzhang@apache.org>
+ 2014-07-30 13:19:05 -0700
+ Commit: 94d1f46, github.com/apache/spark/pull/1338
+
+ dev/check-license wrap folders in quotes.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 13:17:14 -0700
+ Commit: 437dc8c
+
+ [SQL] Fix compiling of catalyst docs.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-30 13:11:09 -0700
+ Commit: 2248891, github.com/apache/spark/pull/1653
+
+ More wrapping FWDIR in quotes.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 13:04:20 -0700
+ Commit: 0feb349
+
+ Wrap FWDIR in quotes in dev/check-license.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 12:33:42 -0700
+ Commit: 95cf203
+
+ Wrap FWDIR in quotes.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 12:24:35 -0700
+ Commit: f2eb84f
+
+ [SPARK-2746] Set SBT_MAVEN_PROFILES only when it is not set explicitly by the user.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 11:45:24 -0700
+ Commit: ff511ba, github.com/apache/spark/pull/1655
+
+ [SPARK-2544][MLLIB] Improve ALS algorithm resource usage
+ GuoQiang Li <witgo@qq.com>, witgo <witgo@qq.com>
+ 2014-07-30 11:00:11 -0700
+ Commit: fc47bb6, github.com/apache/spark/pull/929
+
+ Avoid numerical instability
+ Naftali Harris <naftaliharris@gmail.com>
+ 2014-07-30 09:56:59 -0700
+ Commit: e3d85b7, github.com/apache/spark/pull/1652
+
+ [SPARK-2747] git diff --dirstat can miss sql changes and not run Hive tests
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 09:28:53 -0700
+ Commit: 3bc3f18, github.com/apache/spark/pull/1656
+
+ [SPARK-2521] Broadcast RDD object (instead of sending it along with every task)
+ Reynold Xin <rxin@apache.org>
+ 2014-07-30 09:27:43 -0700
+ Commit: 774142f, github.com/apache/spark/pull/1498
+
+ SPARK-2748 [MLLIB] [GRAPHX] Loss of precision for small arguments to Math.exp, Math.log
+ Sean Owen <srowen@gmail.com>
+ 2014-07-30 08:55:15 -0700
+ Commit: ee07541, github.com/apache/spark/pull/1659
+
+ SPARK-2543: Allow user to set maximum Kryo buffer size
+ Koert Kuipers <koert@tresata.com>
+ 2014-07-30 00:18:59 -0700
+ Commit: 7c5fc28, github.com/apache/spark/pull/735
+
+ [SPARK-2179][SQL] Public API for DataTypes and Schema
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-30 00:15:31 -0700
+ Commit: 7003c16, github.com/apache/spark/pull/1346
+
+ [SPARK-2260] Fix standalone-cluster mode, which was broken
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-29 23:52:09 -0700
+ Commit: 4ce92cc, github.com/apache/spark/pull/1538
+
+ [SQL] Handle null values in debug()
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-29 22:42:54 -0700
+ Commit: 077f633, github.com/apache/spark/pull/1646
+
+ [SPARK-2568] RangePartitioner should run only one job if data is balanced
+ Xiangrui Meng <meng@databricks.com>, Reynold Xin <rxin@apache.org>
+ 2014-07-29 22:16:20 -0700
+ Commit: 2e6efca, github.com/apache/spark/pull/1562
+
+ [SPARK-2054][SQL] Code Generation for Expression Evaluation
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-29 20:58:05 -0700
+ Commit: 8446746, github.com/apache/spark/pull/993
+
+ [SPARK-2305] [PySpark] Update Py4J to version 0.8.2.1
+ Josh Rosen <joshrosen@apache.org>
+ 2014-07-29 19:02:06 -0700
+ Commit: 22649b6, github.com/apache/spark/pull/1626
+
+ [SPARK-2631][SQL] Use SQLConf to configure in-memory columnar caching
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-29 18:20:51 -0700
+ Commit: 86534d0, github.com/apache/spark/pull/1638
+
+ [SPARK-2716][SQL] Don't check resolved for having filters.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-29 18:14:20 -0700
+ Commit: 39b8193, github.com/apache/spark/pull/1640
+
+ MAINTENANCE: Automated closing of pull requests.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-07-29 17:52:48 -0700
+ Commit: 2c35666, github.com/apache/spark/pull/740
+
+ [SPARK-2393][SQL] Cost estimation optimization framework for Catalyst logical plans & sample usage.
+ Zongheng Yang <zongheng.y@gmail.com>
+ 2014-07-29 15:32:50 -0700
+ Commit: c7db274, github.com/apache/spark/pull/1238
+
+ [SPARK-2082] stratified sampling in PairRDDFunctions that guarantees exact sample size
+ Doris Xin <doris.s.xin@gmail.com>, Xiangrui Meng <meng@databricks.com>
+ 2014-07-29 12:49:44 -0700
+ Commit: dc96536, github.com/apache/spark/pull/1025
+
+ [SPARK-2674] [SQL] [PySpark] support datetime type for SchemaRDD
+ Davies Liu <davies.liu@gmail.com>
+ 2014-07-29 12:31:39 -0700
+ Commit: f0d880e, github.com/apache/spark/pull/1601
+
+ [SPARK-2730][SQL] When retrieving a value from a Map, GetItem evaluates key twice
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-29 12:23:34 -0700
+ Commit: e364348, github.com/apache/spark/pull/1637
+
+ [SQL]change some test lists
+ Daoyuan <daoyuan.wang@intel.com>
+ 2014-07-29 12:22:48 -0700
+ Commit: 0c5c6a6, github.com/apache/spark/pull/1634
+
+ [STREAMING] SPARK-1729. Make Flume pull data from source, rather than the current pu...
+ Hari Shreedharan <harishreedharan@gmail.com>, Hari Shreedharan <hshreedharan@apache.org>, Tathagata Das <tathagata.das1565@gmail.com>, harishreedharan <hshreedharan@cloudera.com>
+ 2014-07-29 11:11:29 -0700
+ Commit: 800ecff, github.com/apache/spark/pull/807
+
+ Minor indentation and comment typo fixes.
+ Aaron Staple <astaple@gmail.com>
+ 2014-07-29 01:35:26 -0700
+ Commit: fc4d057, github.com/apache/spark/pull/1630
+
+ [SPARK-2174][MLLIB] treeReduce and treeAggregate
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-29 01:16:41 -0700
+ Commit: 20424da, github.com/apache/spark/pull/1110
+
+ [SPARK-2726] and [SPARK-2727] Remove SortOrder and do in-place sort.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-29 01:12:44 -0700
+ Commit: 96ba04b, github.com/apache/spark/pull/1631
+
+ [SPARK-791] [PySpark] fix pickle itemgetter with cloudpickle
+ Davies Liu <davies.liu@gmail.com>
+ 2014-07-29 01:02:18 -0700
+ Commit: 92ef026, github.com/apache/spark/pull/1627
+
+ [SPARK-2580] [PySpark] keep silent in worker if JVM close the socket
+ Davies Liu <davies.liu@gmail.com>
+ 2014-07-29 00:15:45 -0700
+ Commit: ccd5ab5, github.com/apache/spark/pull/1625
+
+ Excess judgment
+ Yadong Qi <qiyadong2010@gmail.com>
+ 2014-07-28 21:39:02 -0700
+ Commit: 16ef4d1, github.com/apache/spark/pull/1629
+
+ Use commons-lang3 in SignalLogger rather than commons-lang
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-28 13:37:44 -0700
+ Commit: 39ab87b, github.com/apache/spark/pull/1621
+
+ [SPARK-2410][SQL] Merging Hive Thrift/JDBC server (with Maven profile fix)
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-07-28 12:07:30 -0700
+ Commit: a7a9d14, github.com/apache/spark/pull/1620
+
+ [SPARK-2479][MLlib] Comparing floating-point numbers using relative error in UnitTests
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-07-28 11:34:19 -0700
+ Commit: 255b56f, github.com/apache/spark/pull/1425
+
+ [SPARK-2523] [SQL] Hadoop table scan bug fixing
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-07-28 10:59:53 -0700
+ Commit: 2b8d89e, github.com/apache/spark/pull/1439
+
+ [SPARK-1550] [PySpark] Allow SparkContext creation after failed attempts
+ Josh Rosen <joshrosen@apache.org>
+ 2014-07-27 22:54:43 -0700
+ Commit: a7d145e, github.com/apache/spark/pull/1606
+
+ SPARK-2651: Add maven scalastyle plugin
+ Rahul Singhal <rahul.singhal@guavus.com>
+ 2014-07-27 18:50:32 -0700
+ Commit: d7eac4c, github.com/apache/spark/pull/1550
+
+ Revert "[SPARK-2410][SQL] Merging Hive Thrift/JDBC server"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-07-27 18:46:58 -0700
+ Commit: e5bbce9
+
+ [SPARK-2514] [mllib] Random RDD generator
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-07-27 16:16:39 -0700
+ Commit: 81fcdd2, github.com/apache/spark/pull/1520
+
+ [SPARK-1777] Prevent OOMs from single partitions
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-27 16:08:16 -0700
+ Commit: ecf30ee, github.com/apache/spark/pull/1165
+
+ [SPARK-2410][SQL] Merging Hive Thrift/JDBC server
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-07-27 13:03:38 -0700
+ Commit: f6ff2a6, github.com/apache/spark/pull/1600
+
+ [SPARK-2705][CORE] Fixed stage description in stage info page
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-07-27 12:35:21 -0700
+ Commit: 2bbf235, github.com/apache/spark/pull/1524
+
+ SPARK-2684: Update ExternalAppendOnlyMap to take an iterator as input
+ Matei Zaharia <matei@databricks.com>
+ 2014-07-27 11:20:20 -0700
+ Commit: 9857053, github.com/apache/spark/pull/1607
+
+ [SPARK-2679] [MLLib] Ser/De for Double
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-07-27 07:21:07 -0700
+ Commit: 3a69c72, github.com/apache/spark/pull/1581
+
+ [SPARK-2361][MLLIB] Use broadcast instead of serializing data directly into task closure
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-26 22:56:07 -0700
+ Commit: aaf2b73, github.com/apache/spark/pull/1427
+
+ SPARK-2680: Lower spark.shuffle.memoryFraction to 0.2 by default
+ Matei Zaharia <matei@databricks.com>
+ 2014-07-26 22:44:17 -0700
+ Commit: b547f69, github.com/apache/spark/pull/1593
+
+ [SPARK-2601] [PySpark] Fix Py4J error when transforming pickleFiles
+ Josh Rosen <joshrosen@apache.org>
+ 2014-07-26 17:37:05 -0700
+ Commit: ba46bbe, github.com/apache/spark/pull/1605
+
+ [SPARK-2704] Name threads in ConnectionManager and mark them as daemon.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-26 15:00:32 -0700
+ Commit: 1290164, github.com/apache/spark/pull/1604
+
+ [SPARK-2279] Added emptyRDD method to Java API
+ bpaulin <bob@bobpaulin.com>
+ 2014-07-26 10:27:09 -0700
+ Commit: c183b92, github.com/apache/spark/pull/1597
+
+ [SPARK-2652] [PySpark] Turning some default configs for PySpark
+ Davies Liu <davies.liu@gmail.com>
+ 2014-07-26 01:07:08 -0700
+ Commit: 75663b5, github.com/apache/spark/pull/1568
+
+ [SPARK-2696] Reduce default value of spark.serializer.objectStreamReset
+ Hossein <hossein@databricks.com>
+ 2014-07-26 01:04:56 -0700
+ Commit: 66f26a4, github.com/apache/spark/pull/1595
+
+ [SPARK-1458] [PySpark] Expose sc.version in Java and PySpark
+ Josh Rosen <joshrosen@apache.org>
+ 2014-07-26 00:54:05 -0700
+ Commit: cf3e9fd, github.com/apache/spark/pull/1596
+
+ [SPARK-2659][SQL] Fix division semantics for hive
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-25 19:17:49 -0700
+ Commit: 8904791, github.com/apache/spark/pull/1557
+
+ Part of [SPARK-2456] Removed some HashMaps from DAGScheduler by storing information in Stage.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-25 18:45:02 -0700
+ Commit: 9d8666c, github.com/apache/spark/pull/1561
+
+ Revert "[SPARK-2410][SQL] Merging Hive Thrift/JDBC server"
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-25 15:36:57 -0700
+ Commit: afd757a, github.com/apache/spark/pull/1594
+
+ [SPARK-1726] [SPARK-2567] Eliminate zombie stages in UI.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-07-25 15:14:13 -0700
+ Commit: 37ad3b7, github.com/apache/spark/pull/1566
+
+ [SPARK-2125] Add sort flag and move sort into shuffle implementations
+ jerryshao <saisai.shao@intel.com>
+ 2014-07-25 14:34:38 -0700
+ Commit: 47b6b38, github.com/apache/spark/pull/1210
+
+ [SQL]Update HiveMetastoreCatalog.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-07-25 13:59:45 -0700
+ Commit: ab3c6a4, github.com/apache/spark/pull/1569
+
+ [SPARK-2682] Javadoc generated from Scala source code is not in javadoc's index
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-25 13:00:13 -0700
+ Commit: a19d8c8, github.com/apache/spark/pull/1584
+
+ [SPARK-2410][SQL] Merging Hive Thrift/JDBC server
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-07-25 12:20:49 -0700
+ Commit: 06dc0d2, github.com/apache/spark/pull/1399
+
+ [SPARK-2683] unidoc failed because org.apache.spark.util.CallSite uses Java keywords as value names
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-25 11:14:51 -0700
+ Commit: 32bcf9a, github.com/apache/spark/pull/1585
+
+ Replace println with log4j
+ fireflyc <fireflyc@126.com>
+ 2014-07-25 10:47:52 -0700
+ Commit: a2715cc, github.com/apache/spark/pull/1372
+
+ [SPARK-2665] [SQL] Add EqualNS & Unit Tests
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-07-25 01:30:22 -0700
+ Commit: 184aa1c, github.com/apache/spark/pull/1570
+
+ [SPARK-2529] Clean closures in foreach and foreachPartition.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-25 01:10:05 -0700
+ Commit: eb82abd, github.com/apache/spark/pull/1583
+
+ SPARK-2657 Use more compact data structures than ArrayBuffer in groupBy & cogroup
+ Matei Zaharia <matei@databricks.com>
+ 2014-07-25 00:32:32 -0700
+ Commit: 8529ced, github.com/apache/spark/pull/1555
+
+ [SPARK-2656] Python version of stratified sampling
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-07-24 23:42:08 -0700
+ Commit: 2f75a4a, github.com/apache/spark/pull/1554
+
+ [SPARK-2538] [PySpark] Hash based disk spilling aggregation
+ Davies Liu <davies.liu@gmail.com>
+ 2014-07-24 22:53:47 -0700
+ Commit: 14174ab, github.com/apache/spark/pull/1460
+
+ [SPARK-2014] Make PySpark store RDDs in MEMORY_ONLY_SER with compression by default
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-07-24 18:15:37 -0700
+ Commit: eff9714, github.com/apache/spark/pull/1051
+
+ [SPARK-2464][Streaming] Fixed Twitter stream stopping bug
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-07-24 15:59:09 -0700
+ Commit: a45d548, github.com/apache/spark/pull/1577
+
+ SPARK-2250: show stage RDDs in UI
+ Neville Li <neville@spotify.com>
+ 2014-07-24 14:13:00 -0700
+ Commit: fec641b, github.com/apache/spark/pull/1188
+
+ [SPARK-2037]: yarn client mode doesn't support spark.yarn.max.executor.failures
+ GuoQiang Li <witgo@qq.com>
+ 2014-07-24 14:46:10 -0500
+ Commit: 323a83c, github.com/apache/spark/pull/1180
+
+ [SPARK-2479 (partial)][MLLIB] fix binary metrics unit tests
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-24 12:37:02 -0700
+ Commit: c960b50, github.com/apache/spark/pull/1576
+
+ [SPARK-2603][SQL] Remove unnecessary toMap and toList in converting Java collections to Scala collections JsonRDD.scala
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-24 11:19:19 -0700
+ Commit: b352ef1, github.com/apache/spark/pull/1504
+
+ [Build] SPARK-2619: Configurable filemode for the spark/bin folder in debian package
+ tzolov <christian.tzolov@gmail.com>
+ 2014-07-24 11:12:25 -0700
+ Commit: 9fd1414, github.com/apache/spark/pull/1531
+
+ SPARK-2150: Provide direct link to finished application UI in yarn resou...
+ Rahul Singhal <rahul.singhal@guavus.com>
+ 2014-07-24 09:31:04 -0500
+ Commit: 46e224a, github.com/apache/spark/pull/1094
+
+ [SPARK-2661][bagel]unpersist old processed rdd
+ Daoyuan <daoyuan.wang@intel.com>
+ 2014-07-24 00:09:36 -0700
+ Commit: 42dfab7, github.com/apache/spark/pull/1519
+
+ SPARK-2310. Support arbitrary Spark properties on the command line with ...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-07-23 23:09:25 -0700
+ Commit: e34922a, github.com/apache/spark/pull/1253
+
+ [SPARK-2658][SQL] Add rule for true = 1.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-23 22:52:49 -0700
+ Commit: 78d18fd, github.com/apache/spark/pull/1556
+
+ SPARK-2662: Fix NPE for JsonProtocol
+ GuoQiang Li <witgo@qq.com>
+ 2014-07-23 22:50:39 -0700
+ Commit: 9e7725c, github.com/apache/spark/pull/1511
+
+ Replace RoutingTableMessage with pair
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-07-23 20:11:28 -0700
+ Commit: 2d25e34, github.com/apache/spark/pull/1553
+
+ [SPARK-2484][SQL] Build should not run hivecompatibility tests by default.
+ witgo <witgo@qq.com>
+ 2014-07-23 18:17:05 -0700
+ Commit: 60f0ae3, github.com/apache/spark/pull/1403
+
+ [SPARK-2549] Functions defined inside of other functions trigger failures
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-07-23 17:12:28 -0700
+ Commit: 9b76332, github.com/apache/spark/pull/1510
+
+ [SPARK-2102][SQL][CORE] Add option for kryo registration required and use a resource pool in Spark SQL for Kryo instances.
+ Ian O Connell <ioconnell@twitter.com>
+ 2014-07-23 16:30:06 -0700
+ Commit: efdaeb1, github.com/apache/spark/pull/1377
+
+ [SPARK-2569][SQL] Fix shipping of TEMPORARY hive UDFs.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-23 16:26:55 -0700
+ Commit: 1871574, github.com/apache/spark/pull/1552
+
+ SPARK-2226: [SQL] transform HAVING clauses with aggregate expressions that aren't in the aggregation list
+ William Benton <willb@redhat.com>
+ 2014-07-23 16:25:32 -0700
+ Commit: e060d3e, github.com/apache/spark/pull/1497
+
+ SPARK-2277: clear host->rack info properly
+ Rui Li <rui.li@intel.com>
+ 2014-07-23 16:23:24 -0700
+ Commit: 91903e0, github.com/apache/spark/pull/1454
+
+ [SPARK-2588][SQL] Add some more DSLs.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-23 14:47:23 -0700
+ Commit: 1b790cf, github.com/apache/spark/pull/1491
+
+ [CORE] SPARK-2640: In "local[N]", free cores of the only executor should be touched by "spark.task.cpus" for every finish/start-up of tasks.
+ woshilaiceshide <woshilaiceshide@qq.com>
+ 2014-07-23 11:05:41 -0700
+ Commit: f776bc9, github.com/apache/spark/pull/1544
+
+ [SPARK-2609] Log thread ID when spilling ExternalAppendOnlyMap
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-23 10:31:45 -0700
+ Commit: 2592111, github.com/apache/spark/pull/1517
+
+ [SPARK-2617] Correct doc and usages of preservesPartitioning
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-23 00:58:55 -0700
+ Commit: 4c7243e, github.com/apache/spark/pull/1526
+
+ Remove GraphX MessageToPartition for compatibility with sort-based shuffle
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-07-22 22:18:30 -0700
+ Commit: 6c2be93, github.com/apache/spark/pull/1537
+
+ [YARN] SPARK-2577: File upload to viewfs is broken due to mount point re...
+ Gera Shegalov <gera@twitter.com>
+ 2014-07-22 21:05:12 -0500
+ Commit: 02e4572, github.com/apache/spark/pull/1483
+
+ [YARN][SPARK-2606]:In some cases,the spark UI pages display incorrect
+ GuoQiang Li <witgo@qq.com>
+ 2014-07-22 20:34:40 -0500
+ Commit: ddadf1b, github.com/apache/spark/pull/1501
+
+ Graphx example
+ CrazyJvm <crazyjvm@gmail.com>
+ 2014-07-22 18:14:44 -0700
+ Commit: 5f7b991, github.com/apache/spark/pull/1523
+
+ [SPARK-2615] [SQL] Add Equal Sign "==" Support for HiveQl
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-07-22 18:13:28 -0700
+ Commit: 79fe763, github.com/apache/spark/pull/1522
+
+ SPARK-2047: Introduce an in-mem Sorter, and use it to reduce mem usage
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-22 11:58:53 -0700
+ Commit: 85d3596, github.com/apache/spark/pull/1502
+
+ [MLLIB] make Mima ignore updateFeatures (private) in ALS
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-22 11:45:37 -0700
+ Commit: 1407871, github.com/apache/spark/pull/1533
+
+ [SPARK-2612] [mllib] Fix data skew in ALS
+ peng.zhang <peng.zhang@xiaomi.com>
+ 2014-07-22 02:39:07 -0700
+ Commit: 75db174, github.com/apache/spark/pull/1521
+
+ [SPARK-2452] Create a new valid for each instead of using lineId.
+ Prashant Sharma <prashant@apache.org>
+ 2014-07-22 00:38:26 -0700
+ Commit: 81fec99, github.com/apache/spark/pull/1441
+
+ [SPARK-2470] PEP8 fixes to PySpark
+ Nicholas Chammas <nicholas.chammas@gmail.com>, nchammas <nicholas.chammas@gmail.com>
+ 2014-07-21 22:30:53 -0700
+ Commit: 5d16d5b, github.com/apache/spark/pull/1505
+
+ [SPARK-2086] Improve output of toDebugString to make shuffle boundaries more clear
+ Gregory Owen <greowen@gmail.com>
+ 2014-07-21 18:55:01 -0700
+ Commit: c3462c6, github.com/apache/spark/pull/1364
+
+ [SPARK-2561][SQL] Fix apply schema
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-21 18:18:17 -0700
+ Commit: 511a731, github.com/apache/spark/pull/1470
+
+ [SPARK-2434][MLlib]: Warning messages that point users to original MLlib implementations added to Examples
+ Burak <brkyvz@gmail.com>
+ 2014-07-21 17:03:40 -0700
+ Commit: a4d6020, github.com/apache/spark/pull/1515
+
+ Fix flakey HiveQuerySuite test
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-21 14:35:15 -0700
+ Commit: abeacff, github.com/apache/spark/pull/1514
+
+ [SPARK-2494] [PySpark] make hash of None consistent across machines
+ Davies Liu <davies.liu@gmail.com>
+ 2014-07-21 11:59:54 -0700
+ Commit: 872538c, github.com/apache/spark/pull/1371
+
+ SPARK-1707. Remove unnecessary 3 second sleep in YarnClusterScheduler
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-07-21 13:15:46 -0500
+ Commit: f89cf65, github.com/apache/spark/pull/634
+
+ [SPARK-2190][SQL] Specialized ColumnType for Timestamp
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-07-21 00:46:28 -0700
+ Commit: cd273a2, github.com/apache/spark/pull/1440
+
+ [SPARK-1945][MLLIB] Documentation Improvements for Spark 1.0
+ Michael Giannakopoulos <miccagiann@gmail.com>
+ 2014-07-20 20:48:44 -0700
+ Commit: db56f2d, github.com/apache/spark/pull/1311
+
+ Improve scheduler delay tooltip.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-07-20 20:18:18 -0700
+ Commit: f6e7302, github.com/apache/spark/pull/1488
+
+ [SPARK-2552][MLLIB] stabilize logistic function in pyspark
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-20 18:40:36 -0700
+ Commit: b86db51, github.com/apache/spark/pull/1493
+
+ SPARK-2564. ShuffleReadMetrics.totalBlocksRead is redundant
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-07-20 14:45:34 -0700
+ Commit: 9564f85, github.com/apache/spark/pull/1474
+
+ [SPARK-2495][MLLIB] remove private[mllib] from linear models' constructors
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-20 13:04:59 -0700
+ Commit: 1b10b81, github.com/apache/spark/pull/1492
+
+ [SPARK-2598] RangePartitioner's binary search does not use the given Ordering
+ Reynold Xin <rxin@apache.org>
+ 2014-07-20 11:06:06 -0700
+ Commit: fa51b0f, github.com/apache/spark/pull/1500
+
+ SPARK-2519 part 2. Remove pattern matching on Tuple2 in critical section...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-07-20 01:24:32 -0700
+ Commit: 98ab411, github.com/apache/spark/pull/1447
+
+ [SPARK-2524] missing document about spark.deploy.retainedDrivers
+ lianhuiwang <lianhuiwang09@gmail.com>, Wang Lianhui <lianhuiwang09@gmail.com>, unknown <Administrator@taguswang-PC1.tencent.com>
+ 2014-07-19 20:46:59 -0700
+ Commit: 4da01e3, github.com/apache/spark/pull/1443
+
+ SPARK-2587: Fix error message in make-distribution.sh
+ Mark Wagner <mwagner@mwagner-ld.linkedin.biz>
+ 2014-07-19 20:24:13 -0700
+ Commit: c119498, github.com/apache/spark/pull/1489
+
+ Typo fix to the programming guide in the docs
+ Cesar Arevalo <cesar@zephyrhealthinc.com>
+ 2014-07-19 20:20:07 -0700
+ Commit: 0d01e85, github.com/apache/spark/pull/1495
+
+ SPARK-2596 HOTFIX: Deal with non-existent JIRAs.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-07-19 18:24:21 -0700
+ Commit: d39e3b9
+
+ SPARK-2596 A tool for mirroring github pull requests on JIRA.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-07-19 18:19:08 -0700
+ Commit: 49e4727, github.com/apache/spark/pull/1496
+
+ Revert "[SPARK-2521] Broadcast RDD object (instead of sending it along with every task)."
+ Reynold Xin <rxin@apache.org>
+ 2014-07-19 16:56:22 -0700
+ Commit: 1efb369
+
+ SPARK-2407: Added Parser of SQL SUBSTR()
+ chutium <teng.qiu@gmail.com>
+ 2014-07-19 11:04:41 -0500
+ Commit: 2a73211, github.com/apache/spark/pull/1442
+
+ put 'curRequestSize = 0' after 'logDebug' it
+ Lijie Xu <csxulijie@gmail.com>
+ 2014-07-19 01:27:26 -0700
+ Commit: 805f329, github.com/apache/spark/pull/1477
+
+ [SPARK-2521] Broadcast RDD object (instead of sending it along with every task).
+ Reynold Xin <rxin@apache.org>
+ 2014-07-18 23:52:47 -0700
+ Commit: 7b8cd17, github.com/apache/spark/pull/1452
+
+ [SPARK-2359][MLlib] Correlations
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-07-18 17:25:32 -0700
+ Commit: a243364, github.com/apache/spark/pull/1367
+
+ [SPARK-2571] Correctly report shuffle read metrics.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-07-18 14:40:32 -0700
+ Commit: 7b971b9, github.com/apache/spark/pull/1476
+
+ [SPARK-2540] [SQL] Add HiveDecimal & HiveVarchar support in unwrapping data
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-07-18 16:38:11 -0500
+ Commit: 7f17208, github.com/apache/spark/pull/1436
+
+ [SPARK-2535][SQL] Add StringComparison case to NullPropagation.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-18 16:24:00 -0500
+ Commit: 3a1709f, github.com/apache/spark/pull/1451
+
+ [MLlib] SPARK-1536: multiclass classification support for decision tree
+ Manish Amde <manish9ue@gmail.com>, manishamde <manish9ue@gmail.com>, Evan Sparks <sparks@cs.berkeley.edu>
+ 2014-07-18 14:00:13 -0700
+ Commit: d88f6be, github.com/apache/spark/pull/886
+
+ Reservoir sampling implementation.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-18 12:41:50 -0700
+ Commit: 586e716, github.com/apache/spark/pull/1478
+
+ Added t2 instance types
+ Basit Mustafa <basitmustafa@computes-things-for-basit.local>
+ 2014-07-18 12:23:47 -0700
+ Commit: 7f87ab9, github.com/apache/spark/pull/1446
+
+ SPARK-2553. Fix compile error
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-07-18 00:47:43 -0700
+ Commit: 30b8d36, github.com/apache/spark/pull/1479
+
+ SPARK-2553. CoGroupedRDD unnecessarily allocates a Tuple2 per dependency...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-07-17 23:57:08 -0700
+ Commit: e52b871, github.com/apache/spark/pull/1461
+
+ [SPARK-2570] [SQL] Fix the bug of ClassCastException
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-07-17 23:25:01 -0700
+ Commit: 29809a6, github.com/apache/spark/pull/1475
+
+ [SPARK-2411] Add a history-not-found page to standalone Master
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-17 19:45:59 -0700
+ Commit: 6afca2d, github.com/apache/spark/pull/1336
+
+ [SPARK-2299] Consolidate various stageIdTo* hash maps in JobProgressListener
+ Reynold Xin <rxin@apache.org>
+ 2014-07-17 18:58:48 -0700
+ Commit: 72e9021, github.com/apache/spark/pull/1262
+
+ SPARK-1215 [MLLIB]: Clustering: Index out of bounds error (2)
+ Joseph K. Bradley <joseph.kurata.bradley@gmail.com>
+ 2014-07-17 15:05:02 -0700
+ Commit: 935fe65, github.com/apache/spark/pull/1468
+
+ SPARK-1478.2 Fix incorrect NioServerSocketChannelFactory constructor call
+ Sean Owen <srowen@gmail.com>
+ 2014-07-17 12:20:48 -0700
+ Commit: 1fcd5dc, github.com/apache/spark/pull/1466
+
+ [SPARK-2534] Avoid pulling in the entire RDD in various operators
+ Reynold Xin <rxin@apache.org>
+ 2014-07-17 10:54:53 -0700
+ Commit: d988d34, github.com/apache/spark/pull/1450
+
+ [SPARK-2423] Clean up SparkSubmit for readability
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-17 01:13:32 -0700
+ Commit: 9c73822, github.com/apache/spark/pull/1349
+
+ SPARK-2526: Simplify options in make-distribution.sh
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-07-17 01:02:35 -0700
+ Commit: d0ea496, github.com/apache/spark/pull/1445
+
+ [SPARK-2412] CoalescedRDD throws exception with certain pref locs
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-17 01:01:14 -0700
+ Commit: 7c23c0d, github.com/apache/spark/pull/1337
+
+ [SPARK-2154] Schedule next Driver when one completes (standalone mode)
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-16 14:16:48 -0700
+ Commit: 9c24974, github.com/apache/spark/pull/1405
+
+ SPARK-1097: Do not introduce deadlock while fixing concurrency bug
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-16 14:10:17 -0700
+ Commit: 8867cd0, github.com/apache/spark/pull/1409
+
+ [SPARK-2317] Improve task logging.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-16 11:50:49 -0700
+ Commit: 7c8d123, github.com/apache/spark/pull/1259
+
+ fix compile error of streaming project
+ James Z.M. Gao <gaozhm@mediav.com>
+ 2014-07-16 11:35:21 -0700
+ Commit: caa163f, github.com/apache/spark/pull/153
+
+ [SPARK-2522] set default broadcast factory to torrent
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-16 11:27:51 -0700
+ Commit: 96f28c9, github.com/apache/spark/pull/1437
+
+ [SPARK-2517] Remove some compiler warnings.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-16 11:15:07 -0700
+ Commit: ef48222, github.com/apache/spark/pull/1433
+
+ [SPARK-2518][SQL] Fix foldability of Substring expression.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-16 11:13:38 -0700
+ Commit: cc965ee, github.com/apache/spark/pull/1432
+
+ SPARK-2519. Eliminate pattern-matching on Tuple2 in performance-critical...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-07-16 11:07:16 -0700
+ Commit: fc7edc9, github.com/apache/spark/pull/1435
+
+ [SQL] Cleaned up ConstantFolding slightly.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-16 10:55:47 -0700
+ Commit: 1c5739f, github.com/apache/spark/pull/1430
+
+ [SPARK-2525][SQL] Remove as many compilation warning messages as possible in Spark SQL
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-16 10:53:59 -0700
+ Commit: df95d82, github.com/apache/spark/pull/1444
+
+ Tightening visibility for various Broadcast related classes.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-16 10:44:54 -0700
+ Commit: efe2a8b, github.com/apache/spark/pull/1438
+
+ SPARK-2277: make TaskScheduler track hosts on rack
+ Rui Li <rui.li@intel.com>
+ 2014-07-16 22:53:37 +0530
+ Commit: 33e64ec, github.com/apache/spark/pull/1212
+
+ [SPARK-2119][SQL] Improved Parquet performance when reading off S3
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-07-16 12:44:51 -0400
+ Commit: efc452a, github.com/apache/spark/pull/1370
+
+ [SPARK-2504][SQL] Fix nullability of Substring expression.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-15 22:43:48 -0700
+ Commit: 632fb3d, github.com/apache/spark/pull/1426
+
+ [SPARK-2509][SQL] Add optimization for Substring.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-15 22:35:34 -0700
+ Commit: 9b38b7c, github.com/apache/spark/pull/1428
+
+ [SPARK-2314][SQL] Override collect and take in JavaSchemaRDD, forwarding to SchemaRDD implementations.
+ Aaron Staple <aaron.staple@gmail.com>
+ 2014-07-15 21:35:36 -0700
+ Commit: 90ca532, github.com/apache/spark/pull/1421
+
+ follow pep8 None should be compared using is or is not
+ Ken Takagiwa <ken@Kens-MacBook-Pro.local>
+ 2014-07-15 21:34:05 -0700
+ Commit: 563acf5, github.com/apache/spark/pull/1422
+
+ [SPARK-2500] Move the logInfo for registering BlockManager to BlockManagerMasterActor.register method
+ Henry Saputra <henry.saputra@gmail.com>
+ 2014-07-15 21:21:52 -0700
+ Commit: 9c12de5, github.com/apache/spark/pull/1424
+
+ [SPARK-2469] Use Snappy (instead of LZF) for default shuffle compression codec
+ Reynold Xin <rxin@apache.org>
+ 2014-07-15 18:47:39 -0700
+ Commit: 4576d80, github.com/apache/spark/pull/1415
+
+ [SPARK-2498] [SQL] Synchronize on a lock when using scala reflection inside data type objects.
+ Zongheng Yang <zongheng.y@gmail.com>
+ 2014-07-15 17:58:28 -0700
+ Commit: c2048a5, github.com/apache/spark/pull/1423
+
+ [SQL] Attribute equality comparisons should be done by exprId.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-15 17:56:17 -0700
+ Commit: 502f907, github.com/apache/spark/pull/1414
+
+ SPARK-2407: Added internal implementation of SQL SUBSTR()
+ William Benton <willb@redhat.com>
+ 2014-07-15 14:11:57 -0700
+ Commit: 61de65b, github.com/apache/spark/pull/1359
+
+ [SPARK-2474][SQL] For a registered table in OverrideCatalog, the Analyzer failed to resolve references in the format of "tableName.fieldName"
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-15 14:06:45 -0700
+ Commit: 8af46d5, github.com/apache/spark/pull/1406
+
+ [SQL] Whitelist more Hive tests.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-15 14:04:01 -0700
+ Commit: bcd0c30, github.com/apache/spark/pull/1396
+
+ [SPARK-2483][SQL] Fix parsing of repeated, nested data access.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-15 14:01:48 -0700
+ Commit: 0f98ef1, github.com/apache/spark/pull/1411
+
+ [SPARK-2471] remove runtime scope for jets3t
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-15 14:00:54 -0700
+ Commit: a21f9a7, github.com/apache/spark/pull/1402
+
+ Added LZ4 to compression codec in configuration page.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-15 13:13:33 -0700
+ Commit: e7ec815, github.com/apache/spark/pull/1417
+
+ SPARK-1291: Link the spark UI to RM ui in yarn-client mode
+ witgo <witgo@qq.com>
+ 2014-07-15 13:52:56 -0500
+ Commit: 72ea56d, github.com/apache/spark/pull/1112
+
+ SPARK-2480: Resolve sbt warnings "NOTE: SPARK_YARN is deprecated, please use -Pyarn flag"
+ witgo <witgo@qq.com>
+ 2014-07-15 10:46:17 -0700
+ Commit: 9dd635e, github.com/apache/spark/pull/1404
+
+ Reformat multi-line closure argument.
+ William Benton <willb@redhat.com>
+ 2014-07-15 09:13:39 -0700
+ Commit: cb09e93, github.com/apache/spark/pull/1419
+
+ [MLLIB] [SPARK-2222] Add multiclass evaluation metrics
+ Alexander Ulanov <nashb@yandex.ru>, unknown <ulanov@ULANOV1.emea.hpqcorp.net>, Xiangrui Meng <meng@databricks.com>
+ 2014-07-15 08:40:22 -0700
+ Commit: 04b01bb, github.com/apache/spark/pull/1155
+
+ README update: added "for Big Data".
+ Reynold Xin <rxin@apache.org>
+ 2014-07-15 02:20:01 -0700
+ Commit: 6555618
+
+ Update README.md to include a slightly more informative project description.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-15 02:15:29 -0700
+ Commit: 8f1d422
+
+ [SPARK-2477][MLlib] Using appendBias for adding intercept in GeneralizedLinearAlgorithm
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-07-15 02:14:58 -0700
+ Commit: 52beb20, github.com/apache/spark/pull/1410
+
+ [SPARK-2399] Add support for LZ4 compression.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-15 01:46:57 -0700
+ Commit: dd95aba, github.com/apache/spark/pull/1416
+
+ discarded exceeded completedDrivers
+ lianhuiwang <lianhuiwang09@gmail.com>
+ 2014-07-15 00:22:06 -0700
+ Commit: 7446f5f, github.com/apache/spark/pull/1114
+
+ [SPARK-2485][SQL] Lock usage of hive client.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-15 00:13:51 -0700
+ Commit: c7c7ac8, github.com/apache/spark/pull/1412
+
+ [SPARK-2390] Files in staging directory cannot be deleted and wastes the space of HDFS
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-07-14 23:55:39 -0700
+ Commit: c6d7574, github.com/apache/spark/pull/1326
+
+ Add/increase severity of warning in documentation of groupBy()
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-14 23:38:12 -0700
+ Commit: a2aa7be, github.com/apache/spark/pull/1380
+
+ SPARK-2486: Utils.getCallSite is now resilient to bogus frames
+ William Benton <willb@redhat.com>
+ 2014-07-14 23:09:13 -0700
+ Commit: 1f99fea, github.com/apache/spark/pull/1413
+
+ [SPARK-2467] Revert SparkBuild to publish-local to both .m2 and .ivy2.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-14 23:06:35 -0700
+ Commit: e2255e4, github.com/apache/spark/pull/1398
+
+ [SPARK-2446][SQL] Add BinaryType support to Parquet I/O.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-14 15:42:28 -0700
+ Commit: 9fe693b, github.com/apache/spark/pull/1373
+
+ [SPARK-1946] Submit tasks after (configured ratio) executors have been registered
+ li-zhihui <zhihui.li@intel.com>
+ 2014-07-14 15:32:49 -0500
+ Commit: 3dd8af7, github.com/apache/spark/pull/900
+
+ [SPARK-2443][SQL] Fix slow read from partitioned tables
+ Zongheng Yang <zongheng.y@gmail.com>
+ 2014-07-14 13:22:24 -0700
+ Commit: d60b09b, github.com/apache/spark/pull/1408
+
+ move some test file to match src code
+ Daoyuan <daoyuan.wang@intel.com>
+ 2014-07-14 10:40:44 -0700
+ Commit: 38ccd6e, github.com/apache/spark/pull/1401
+
+ Made rdd.py pep8 compliant by using Autopep8 and a little manual editing.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-07-14 00:42:59 -0700
+ Commit: aab5349, github.com/apache/spark/pull/1354
+
+ SPARK-2363. Clean MLlib's sample data files
+ Sean Owen <sowen@cloudera.com>
+ 2014-07-13 19:27:43 -0700
+ Commit: 635888c, github.com/apache/spark/pull/1394
+
+ SPARK-2462. Make Vector.apply public.
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-07-12 16:55:15 -0700
+ Commit: 4c8be64, github.com/apache/spark/pull/1389
+
+ [SPARK-2405][SQL] Reusue same byte buffers when creating new instance of InMemoryRelation
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-12 12:13:32 -0700
+ Commit: 1a7d7cc, github.com/apache/spark/pull/1332
+
+ [SPARK-2441][SQL] Add more efficient distinct operator.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-12 12:07:27 -0700
+ Commit: 7e26b57, github.com/apache/spark/pull/1366
+
+ [SPARK-2455] Mark (Shippable)VertexPartition serializable
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-07-12 12:05:34 -0700
+ Commit: 7a01352, github.com/apache/spark/pull/1376
+
+ Use the Executor's ClassLoader in sc.objectFile().
+ Daniel Darabos <darabos.daniel@gmail.com>
+ 2014-07-12 00:07:42 -0700
+ Commit: 2245c87, github.com/apache/spark/pull/181
+
+ use specialized axpy in RowMatrix for SVD
+ Li Pu <lpu@twitter.com>, Xiangrui Meng <meng@databricks.com>, Li Pu <li.pu@outlook.com>
+ 2014-07-11 23:26:47 -0700
+ Commit: d38887b, github.com/apache/spark/pull/1378
+
+ [SPARK-1969][MLlib] Online summarizer APIs for mean, variance, min, and max
+ DB Tsai <dbtsai@dbtsai.com>
+ 2014-07-11 23:04:43 -0700
+ Commit: 5596086, github.com/apache/spark/pull/955
+
+ [SPARK-2457] Inconsistent description in README about build option
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-07-11 21:10:26 -0700
+ Commit: cbff187, github.com/apache/spark/pull/1382
+
+ [SPARK-2437] Rename MAVEN_PROFILES to SBT_MAVEN_PROFILES and add SBT_MAVEN_PROPERTIES
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-07-11 11:52:35 -0700
+ Commit: b23e9c3, github.com/apache/spark/pull/1374
+
+ [Minor] Remove unused val in Master
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-11 00:21:16 -0700
+ Commit: f4f46de, github.com/apache/spark/pull/1365
+
+ fix Graph partitionStrategy comment
+ CrazyJvm <crazyjvm@gmail.com>
+ 2014-07-11 00:02:24 -0700
+ Commit: 282cca0, github.com/apache/spark/pull/1368
+
+ [SPARK-2358][MLLIB] Add an option to include native BLAS/LAPACK loader in the build
+ Xiangrui Meng <meng@databricks.com>
+ 2014-07-10 21:57:54 -0700
+ Commit: 2f59ce7, github.com/apache/spark/pull/1295
+
+ [SPARK-2428][SQL] Add except and intersect methods to SchemaRDD.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-10 19:27:24 -0700
+ Commit: 10b59ba, github.com/apache/spark/pull/1355
+
+ [SPARK-2415] [SQL] RowWriteSupport should handle empty ArrayType correctly.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-10 19:23:44 -0700
+ Commit: f5abd27, github.com/apache/spark/pull/1339
+
+ [SPARK-2431][SQL] Refine StringComparison and related codes.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-10 19:20:00 -0700
+ Commit: f62c427, github.com/apache/spark/pull/1357
+
+ SPARK-2427: Fix Scala examples that use the wrong command line arguments index
+ Artjom-Metro <Artjom-Metro@users.noreply.github.com>, Artjom-Metro <artjom31415@googlemail.com>
+ 2014-07-10 16:03:30 -0700
+ Commit: ae8ca4d, github.com/apache/spark/pull/1353
+
+ [SPARK-1341] [Streaming] Throttle BlockGenerator to limit rate of data consumption.
+ Issac Buenrostro <buenrostro@ooyala.com>
+ 2014-07-10 16:01:08 -0700
+ Commit: 2dd6724, github.com/apache/spark/pull/945
+
+ [SPARK-1478].3: Upgrade FlumeInputDStream's FlumeReceiver to support FLUME-1915
+ tmalaska <ted.malaska@cloudera.com>, Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-07-10 13:15:02 -0700
+ Commit: 40a8fef, github.com/apache/spark/pull/1347
+
+ name ec2 instances and security groups consistently
+ Nicholas Chammas <nicholas.chammas@gmail.com>, nchammas <nicholas.chammas@gmail.com>
+ 2014-07-10 12:56:00 -0700
+ Commit: 369aa84, github.com/apache/spark/pull/1344
+
+ HOTFIX: Minor doc update for sbt change
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-07-10 11:10:43 -0700
+ Commit: 88006a6
+
+ [SPARK-1776] Have Spark's SBT build read dependencies from Maven.
+ Prashant Sharma <prashant.s@imaginea.com>, Patrick Wendell <pwendell@gmail.com>
+ 2014-07-10 11:03:37 -0700
+ Commit: 628932b, github.com/apache/spark/pull/772
+
+ SPARK-2115: Stage kill link is too close to stage details link
+ Masayoshi TSUZUKI <tsudukim@oss.nttdata.co.jp>
+ 2014-07-10 01:18:37 -0700
+ Commit: c2babc0, github.com/apache/spark/pull/1350
+
+ Clean up SparkKMeans example's code
+ Raymond Liu <raymond.liu@intel.com>
+ 2014-07-09 23:39:29 -0700
+ Commit: 2b18ea9, github.com/apache/spark/pull/1352
+
+ HOTFIX: Remove persistently failing test in master.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-07-09 19:44:24 -0700
+ Commit: 553c578
+
+ Revert "[HOTFIX] Synchronize on SQLContext.settings in tests."
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-07-09 19:36:38 -0700
+ Commit: dd22bc2
+
+ SPARK-2416: Allow richer reporting of unit test results
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-07-09 19:26:16 -0700
+ Commit: 2e0a037, github.com/apache/spark/pull/1340
+
+ SPARK-1782: svd for sparse matrix using ARPACK
+ Li Pu <lpu@twitter.com>, Xiangrui Meng <meng@databricks.com>, Li Pu <li.pu@outlook.com>
+ 2014-07-09 12:15:08 -0700
+ Commit: 1f33e1f, github.com/apache/spark/pull/964
+
+ [SPARK-2417][MLlib] Fix DecisionTree tests
+ johnnywalleye <jsondag@gmail.com>
+ 2014-07-09 11:06:34 -0700
+ Commit: d35e3db, github.com/apache/spark/pull/1343
+
+ [STREAMING] SPARK-2343: Fix QueueInputDStream with oneAtATime false
+ Manuel Laflamme <manuel.laflamme@gmail.com>
+ 2014-07-09 10:45:45 -0700
+ Commit: 0eb1152, github.com/apache/spark/pull/1285
+
+ [SPARK-2384] Add tooltips to UI.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-07-08 22:57:21 -0700
+ Commit: 339441f, github.com/apache/spark/pull/1314
+
+ [SPARK-2152][MLlib] fix bin offset in DecisionTree node aggregations (also resolves SPARK-2160)
+ johnnywalleye <jsondag@gmail.com>
+ 2014-07-08 19:17:26 -0700
+ Commit: 1114207, github.com/apache/spark/pull/1316
+
+ [SPARK-2413] Upgrade junit_xml_listener to 0.5.1
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-07-08 17:50:36 -0700
+ Commit: ac9cdc1, github.com/apache/spark/pull/1333
+
+ [SPARK-2392] Executors should not start their own HTTP servers
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-08 17:35:31 -0700
+ Commit: bf04a39, github.com/apache/spark/pull/1335
+
+ [SPARK-2362] Fix for newFilesOnly logic in file DStream
+ Gabriele Nizzoli <mail@nizzoli.net>
+ 2014-07-08 14:23:38 -0700
+ Commit: e6f7bfc, github.com/apache/spark/pull/1077
+
+ [SPARK-2409] Make SQLConf thread safe.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-08 14:00:47 -0700
+ Commit: 32516f8, github.com/apache/spark/pull/1334
+
+ SPARK-2400 : fix spark.yarn.max.executor.failures explaination
+ CrazyJvm <crazyjvm@gmail.com>
+ 2014-07-08 13:55:42 -0500
+ Commit: b520b64, github.com/apache/spark/pull/1282
+
+ [SPARK-2403] Catch all errors during serialization in DAGScheduler
+ Daniel Darabos <darabos.daniel@gmail.com>
+ 2014-07-08 10:43:46 -0700
+ Commit: c8a2313, github.com/apache/spark/pull/1329
+
+ [SPARK-2395][SQL] Optimize common LIKE patterns.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-08 10:36:18 -0700
+ Commit: cc3e0a1, github.com/apache/spark/pull/1325
+
+ [EC2] Add default history server port to ec2 script
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-08 16:49:31 +0900
+ Commit: 56e009d, github.com/apache/spark/pull/1296
+
+ [SPARK-2391][SQL] Custom take() for LIMIT queries.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-08 00:41:46 -0700
+ Commit: 5a40636, github.com/apache/spark/pull/1318
+
+ Resolve sbt warnings during build Ⅱ
+ witgo <witgo@qq.com>
+ 2014-07-08 00:31:42 -0700
+ Commit: 3cd5029, github.com/apache/spark/pull/1153
+
+ Updated programming-guide.md
+ Rishi Verma <riverma@apache.org>
+ 2014-07-08 00:29:23 -0700
+ Commit: 0128905, github.com/apache/spark/pull/1324
+
+ [SPARK-2235][SQL]Spark SQL basicOperator add Intersect operator
+ Yanjie Gao <gaoyanjie55@163.com>, YanjieGao <396154235@qq.com>
+ 2014-07-07 19:40:04 -0700
+ Commit: 50561f4, github.com/apache/spark/pull/1150
+
+ [SPARK-2376][SQL] Selecting list values inside nested JSON objects raises java.lang.IllegalArgumentException
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-07 18:37:38 -0700
+ Commit: 4352a2f, github.com/apache/spark/pull/1320
+
+ [SPARK-2375][SQL] JSON schema inference may not resolve type conflicts correctly for a field inside an array of structs
+ Yin Huai <huaiyin.thu@gmail.com>
+ 2014-07-07 17:05:59 -0700
+ Commit: f0496ee, github.com/apache/spark/pull/1308
+
+ [SPARK-2386] [SQL] RowWriteSupport should use the exact types to cast.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-07 17:04:02 -0700
+ Commit: 4deeed1, github.com/apache/spark/pull/1315
+
+ [SPARK-2339][SQL] SQL parser in sql-core is case sensitive, but a table alias is converted to lower case when we create Subquery
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-07-07 17:01:44 -0700
+ Commit: c0b4cf0, github.com/apache/spark/pull/1317
+
+ [SPARK-1977][MLLIB] register mutable BitSet in MovieLenseALS
+ Neville Li <neville@spotify.com>
+ 2014-07-07 15:06:14 -0700
+ Commit: f7ce1b3, github.com/apache/spark/pull/1319
+
+ [SPARK-2327] [SQL] Fix nullabilities of Join/Generate/Aggregate.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-05 11:51:48 -0700
+ Commit: 9d5ecf8, github.com/apache/spark/pull/1266
+
+ [SPARK-2366] [SQL] Add column pruning for the right side of LeftSemi join.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-05 11:48:08 -0700
+ Commit: 3da8df9, github.com/apache/spark/pull/1301
+
+ [SPARK-2306]:BoundedPriorityQueue is private and not registered with Kry...
+ ankit.bhardwaj <ankit.bhardwaj@guavus.com>
+ 2014-07-04 22:06:10 -0700
+ Commit: 42f3abd, github.com/apache/spark/pull/1299
+
+ [SPARK-2370][SQL] Decrease metadata retrieved for partitioned hive queries.
+ Michael Armbrust <michael@databricks.com>
+ 2014-07-04 19:15:48 -0700
+ Commit: 9d006c9, github.com/apache/spark/pull/1305
+
+ Added SignalLogger to HistoryServer.
+ Reynold Xin <rxin@apache.org>
+ 2014-07-04 17:33:07 -0700
+ Commit: 0db5d5a, github.com/apache/spark/pull/1300
+
+ HOTFIX: Clean before building docs during release.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-07-04 10:01:19 -0700
+ Commit: fc71658
+
+ [SPARK-2234][SQL]Spark SQL basicOperators add Except operator
+ Yanjie Gao <gaoyanjie55@163.com>, YanjieGao <396154235@qq.com>, root <root@node4.(none)>, gaoyanjie <gaoyanjie55@163.com>
+ 2014-07-04 02:43:57 -0700
+ Commit: 5dadda8, github.com/apache/spark/pull/1151
+
+ [SPARK-2059][SQL] Add analysis checks
+ Reynold Xin <rxin@apache.org>, Michael Armbrust <michael@databricks.com>
+ 2014-07-04 00:53:41 -0700
+ Commit: b3e768e, github.com/apache/spark/pull/1265
+
+ Update SQLConf.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-07-04 00:25:31 -0700
+ Commit: 0bbe612, github.com/apache/spark/pull/1272
+
+ [SPARK-1199][REPL] Remove VALId and use the original import style for defined classes.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-07-04 00:05:27 -0700
+ Commit: d434150, github.com/apache/spark/pull/1179
+
+ [SPARK-2059][SQL] Don't throw TreeNodeException in `execution.ExplainCommand`
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-07-03 23:41:54 -0700
+ Commit: 5448804, github.com/apache/spark/pull/1294
+
+ SPARK-2282: Reuse PySpark Accumulator sockets to avoid crashing Spark
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-03 23:02:36 -0700
+ Commit: 97a0bfe, github.com/apache/spark/pull/1220
+
+ [SPARK-2307][Reprise] Correctly report RDD blocks on SparkUI
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-03 22:48:23 -0700
+ Commit: 3894a49, github.com/apache/spark/pull/1255
+
+ [SPARK-2350] Don't NPE while launching drivers
+ Aaron Davidson <aaron@databricks.com>
+ 2014-07-03 22:31:41 -0700
+ Commit: 586feb5, github.com/apache/spark/pull/1289
+
+ [SPARK-1097] Workaround Hadoop conf ConcurrentModification issue
+ Raymond Liu <raymond.liu@intel.com>
+ 2014-07-03 19:24:22 -0700
+ Commit: 5fa0a05, github.com/apache/spark/pull/1273
+
+ Streaming programming guide typos
+ Clément MATHIEU <clement@unportant.info>
+ 2014-07-03 18:31:18 -0700
+ Commit: fdc4c11, github.com/apache/spark/pull/1286
+
+ [HOTFIX] Synchronize on SQLContext.settings in tests.
+ Zongheng Yang <zongheng.y@gmail.com>
+ 2014-07-03 17:37:53 -0700
+ Commit: d4c30cd, github.com/apache/spark/pull/1277
+
+ [SPARK-2109] Setting SPARK_MEM for bin/pyspark does not work.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-07-03 15:06:58 -0700
+ Commit: 731f683b, github.com/apache/spark/pull/1050
+
+ [SPARK-2342] Evaluation helper's output type doesn't conform to input ty...
+ Yijie Shen <henry.yijieshen@gmail.com>
+ 2014-07-03 13:22:13 -0700
+ Commit: a9b52e5, github.com/apache/spark/pull/1283
+
+ SPARK-1675. Make clear whether computePrincipalComponents requires centered data
+ Sean Owen <sowen@cloudera.com>
+ 2014-07-03 11:54:51 -0700
+ Commit: 2b36344, github.com/apache/spark/pull/1171
+
+ [SPARK] Fix NPE for ExternalAppendOnlyMap
+ Andrew Or <andrewor14@gmail.com>
+ 2014-07-03 10:26:50 -0700
+ Commit: c480537, github.com/apache/spark/pull/1288
+
+ [SPARK-2324] SparkContext should not exit directly when spark.local.dir is a list of multiple paths and one of them has error
+ yantangzhai <tyz0303@163.com>
+ 2014-07-03 10:14:35 -0700
+ Commit: 3bbeca6, github.com/apache/spark/pull/1274
+
+ [SPARK-2287] [SQL] Make ScalaReflection be able to handle Generic case classes.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-02 10:10:36 -0700
+ Commit: bc7041a, github.com/apache/spark/pull/1226
+
+ [SPARK-2328] [SQL] Add execution of `SHOW TABLES` before `TestHive.reset()`.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-07-02 10:07:01 -0700
+ Commit: 1e2c26c, github.com/apache/spark/pull/1268
+
+ SPARK-2186: Spark SQL DSL support for simple aggregations such as SUM and AVG
+ Ximo Guanter Gonzalbez <ximo@tid.es>
+ 2014-07-02 10:03:44 -0700
+ Commit: 5c6ec94, github.com/apache/spark/pull/1211
+
+ update the comments in SqlParser
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-07-01 20:37:10 -0700
+ Commit: 6596392, github.com/apache/spark/pull/1275
+
+ [SPARK-2185] Emit warning when task size exceeds a threshold.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-07-01 01:56:51 -0700
+ Commit: 05c3d90, github.com/apache/spark/pull/1149
+
+ SPARK-2332 [build] add exclusion for old servlet-api on hadoop-client in core
+ Peter MacKinnon <pmackinn@redhat.com>
+ 2014-07-01 00:28:38 -0700
+ Commit: 3319a3e, github.com/apache/spark/pull/1271
+
+ SPARK-2293. Replace RDD.zip usage by map with predict inside.
+ Sean Owen <sowen@cloudera.com>
+ 2014-06-30 16:03:38 -0700
+ Commit: 04fa122, github.com/apache/spark/pull/1250
+
+ [SPARK-2318] When exiting on a signal, print the signal name first.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-30 15:12:38 -0700
+ Commit: 5fccb56, github.com/apache/spark/pull/1260
+
+ [SPARK-2322] Exception in resultHandler should NOT crash DAGScheduler and shutdown SparkContext.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-30 11:50:22 -0700
+ Commit: 358ae15, github.com/apache/spark/pull/1264
+
+ SPARK-2077 Log serializer that actually ends up being used
+ Andrew Ash <andrew@andrewash.com>
+ 2014-06-29 23:29:05 -0700
+ Commit: 6803642, github.com/apache/spark/pull/1017
+
+ SPARK-897: preemptively serialize closures
+ William Benton <willb@redhat.com>
+ 2014-06-29 23:27:34 -0700
+ Commit: a484030, github.com/apache/spark/pull/143
+
+ [SPARK-2104] Fix task serializing issues when sort with Java non serializable class
+ jerryshao <saisai.shao@intel.com>
+ 2014-06-29 23:00:00 -0700
+ Commit: 66135a3, github.com/apache/spark/pull/1245
+
+ [SPARK-1683] Track task read metrics.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-06-29 22:01:42 -0700
+ Commit: 7b71a0e, github.com/apache/spark/pull/962
+
+ [SPARK-2320] Reduce exception/code block font size in web ui
+ Reynold Xin <rxin@apache.org>
+ 2014-06-29 16:46:28 -0700
+ Commit: cdf613f, github.com/apache/spark/pull/1261
+
+ Improve MapOutputTracker error logging.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-28 21:05:03 -0700
+ Commit: 2053d79, github.com/apache/spark/pull/1258
+
+ [SPARK-1394] Remove SIGCHLD handler in worker subprocess
+ Matthew Farrellee <matt@redhat.com>
+ 2014-06-28 18:39:27 -0700
+ Commit: 3c104c7, github.com/apache/spark/pull/1247
+
+ [SPARK-2233] make-distribution script should list the git hash in the RELEASE file
+ Guillaume Ballet <gballet@gmail.com>
+ 2014-06-28 13:07:12 -0700
+ Commit: b8f2e13, github.com/apache/spark/pull/1216
+
+ [SPARK-2003] Fix python SparkContext example
+ Matthew Farrellee <matt@redhat.com>
+ 2014-06-27 18:20:33 -0700
+ Commit: 0e0686d, github.com/apache/spark/pull/1246
+
+ [SPARK-2259] Fix highly misleading docs on cluster / client deploy modes
+ Andrew Or <andrewor14@gmail.com>
+ 2014-06-27 16:11:31 -0700
+ Commit: f17510e, github.com/apache/spark/pull/1200
+
+ [SPARK-2307] SparkUI - storage tab displays incorrect RDDs
+ Andrew Or <andrewor14@gmail.com>
+ 2014-06-27 15:23:25 -0700
+ Commit: 21e0f77, github.com/apache/spark/pull/1249
+
+ SPARK-2181:The keys for sorting the columns of Executor page in SparkUI are incorrect
+ witgo <witgo@qq.com>
+ 2014-06-26 21:59:21 -0700
+ Commit: 18f29b9, github.com/apache/spark/pull/1135
+
+ [SPARK-2251] fix concurrency issues in random sampler
+ Xiangrui Meng <meng@databricks.com>
+ 2014-06-26 21:46:55 -0700
+ Commit: c23f5db, github.com/apache/spark/pull/1229
+
+ [SPARK-2297][UI] Make task attempt and speculation more explicit in UI.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-26 21:13:26 -0700
+ Commit: d1636dd, github.com/apache/spark/pull/1236
+
+ Removed throwable field from FetchFailedException and added MetadataFetchFailedException
+ Reynold Xin <rxin@apache.org>
+ 2014-06-26 21:12:16 -0700
+ Commit: bf578de, github.com/apache/spark/pull/1227
+
+ [SQL]Extract the joinkeys from join condition
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-06-26 19:18:11 -0700
+ Commit: 981bde9, github.com/apache/spark/pull/1190
+
+ Strip '@' symbols when merging pull requests.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-26 17:09:24 -0700
+ Commit: f1f7385, github.com/apache/spark/pull/1239
+
+ Fixing AWS instance type information based upon current EC2 data
+ Zichuan Ye <jerry@tangentds.com>
+ 2014-06-26 15:21:29 -0700
+ Commit: 62d4a0f, github.com/apache/spark/pull/1156
+
+ [SPARK-2286][UI] Report exception/errors for failed tasks that are not ExceptionFailure
+ Reynold Xin <rxin@apache.org>
+ 2014-06-26 14:00:45 -0700
+ Commit: 6587ef7, github.com/apache/spark/pull/1225
+
+ [SPARK-2295] [SQL] Make JavaBeans nullability stricter.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-06-26 13:37:19 -0700
+ Commit: 32a1ad7, github.com/apache/spark/pull/1235
+
+ Remove use of spark.worker.instances
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-06-26 08:20:27 -0500
+ Commit: 48a82a8, github.com/apache/spark/pull/1214
+
+ [SPARK-2254] [SQL] ScalaReflection should mark primitive types as non-nullable.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-06-25 23:55:31 -0700
+ Commit: e4899a2, github.com/apache/spark/pull/1193
+
+ [SPARK-2172] PySpark cannot import mllib modules in YARN-client mode
+ Szul, Piotr <Piotr.Szul@csiro.au>
+ 2014-06-25 21:55:49 -0700
+ Commit: 441cdcc, github.com/apache/spark/pull/1223
+
+ [SPARK-2284][UI] Mark all failed tasks as failures.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-25 22:35:03 -0700
+ Commit: 4a346e2, github.com/apache/spark/pull/1224
+
+ [SPARK-1749] Job cancellation when SchedulerBackend does not implement killTask
+ Mark Hamstra <markhamstra@gmail.com>, Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-06-25 20:57:48 -0700
+ Commit: b88a59a, github.com/apache/spark/pull/1219
+
+ [SPARK-2283][SQL] Reset test environment before running PruningSuite
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-25 18:41:47 -0700
+ Commit: 7f196b0, github.com/apache/spark/pull/1221
+
+ [SQL] SPARK-1800 Add broadcast hash join operator & associated hints.
+ Zongheng Yang <zongheng.y@gmail.com>, Michael Armbrust <michael@databricks.com>
+ 2014-06-25 18:06:33 -0700
+ Commit: 9d824fe, github.com/apache/spark/pull/1163
+
+ [SPARK-2204] Launch tasks on the proper executors in mesos fine-grained mode
+ Sebastien Rainville <sebastien@hopper.com>
+ 2014-06-25 13:21:18 -0700
+ Commit: 1132e47, github.com/apache/spark/pull/1140
+
+ [SPARK-2270] Kryo cannot serialize results returned by asJavaIterable
+ Reynold Xin <rxin@apache.org>
+ 2014-06-25 12:43:22 -0700
+ Commit: 7ff2c75, github.com/apache/spark/pull/1206
+
+ [SPARK-2258 / 2266] Fix a few worker UI bugs
+ Andrew Or <andrewor14@gmail.com>
+ 2014-06-25 12:23:08 -0700
+ Commit: 9aa6032, github.com/apache/spark/pull/1213
+
+ [SPARK-2242] HOTFIX: pyspark shell hangs on simple job
+ Andrew Or <andrewor14@gmail.com>
+ 2014-06-25 10:47:22 -0700
+ Commit: 5603e4c, github.com/apache/spark/pull/1178
+
+ Replace doc reference to Shark with Spark SQL.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-25 01:01:23 -0700
+ Commit: ac06a85
+
+ SPARK-2038: rename "conf" parameters in the saveAsHadoop functions with source-compatibility
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-06-25 00:23:32 -0700
+ Commit: acc01ab, github.com/apache/spark/pull/1137
+
+ [BUGFIX][SQL] Should match java.math.BigDecimal when wrapping Hive output
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-25 00:17:28 -0700
+ Commit: 22036ae, github.com/apache/spark/pull/1199
+
+ [SPARK-2263][SQL] Support inserting MAP<K, V> to Hive tables
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-25 00:14:34 -0700
+ Commit: 8fade89, github.com/apache/spark/pull/1205
+
+ SPARK-2248: spark.default.parallelism does not apply in local mode
+ witgo <witgo@qq.com>
+ 2014-06-24 19:44:37 -0700
+ Commit: b6b4485, github.com/apache/spark/pull/1194
+
+ Fix possible null pointer in acumulator toString
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-24 19:39:19 -0700
+ Commit: 2714968, github.com/apache/spark/pull/1204
+
+ Autodetect JAVA_HOME on RPM-based systems
+ Matthew Farrellee <matt@redhat.com>
+ 2014-06-24 19:31:20 -0700
+ Commit: 54055fb, github.com/apache/spark/pull/1185
+
+ [SQL]Add base row updating methods for JoinedRow
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-06-24 19:07:02 -0700
+ Commit: 133495d, github.com/apache/spark/pull/1187
+
+ [SPARK-1112, 2156] Bootstrap to fetch the driver's Spark properties.
+ Xiangrui Meng <meng@databricks.com>
+ 2014-06-24 19:06:07 -0700
+ Commit: 8ca4176, github.com/apache/spark/pull/1132
+
+ [SPARK-2264][SQL] Fix failing CachedTableSuite
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-24 19:04:29 -0700
+ Commit: a162c9b, github.com/apache/spark/pull/1201
+
+ Fix broken Json tests.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-06-24 16:54:50 -0700
+ Commit: 1978a90, github.com/apache/spark/pull/1198
+
+ HOTFIX: Disabling tests per SPARK-2264
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-24 15:09:30 -0700
+ Commit: 221909e
+
+ SPARK-1937: fix issue with task locality
+ Rui Li <rui.li@intel.com>, lirui-intel <rui.li@intel.com>
+ 2014-06-24 11:40:37 -0700
+ Commit: 924b708, github.com/apache/spark/pull/892
+
+ [SPARK-2252] Fix MathJax for HTTPs.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-23 23:18:47 -0700
+ Commit: 420c1c3, github.com/apache/spark/pull/1189
+
+ [SPARK-2124] Move aggregation into shuffle implementations
+ jerryshao <saisai.shao@intel.com>
+ 2014-06-23 20:25:46 -0700
+ Commit: 56eb8af, github.com/apache/spark/pull/1064
+
+ [SPARK-2227] Support dfs command in SQL.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-23 18:34:54 -0700
+ Commit: 51c8168, github.com/apache/spark/pull/1167
+
+ Cleanup on Connection, ConnectionManagerId, ConnectionManager classes part 2
+ Henry Saputra <henry.saputra@gmail.com>
+ 2014-06-23 17:13:26 -0700
+ Commit: 383bf72, github.com/apache/spark/pull/1157
+
+ [SPARK-1768] History server enhancements.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-06-23 13:53:44 -0700
+ Commit: 21ddd7d, github.com/apache/spark/pull/718
+
+ [SPARK-2118] spark class should complain if tools jar is missing.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-06-23 13:35:09 -0700
+ Commit: 6dc6722, github.com/apache/spark/pull/1068
+
+ [SPARK-1669][SQL] Made cacheTable idempotent
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-23 13:24:33 -0700
+ Commit: a4bc442, github.com/apache/spark/pull/1183
+
+ Fix mvn detection
+ Matthew Farrellee <matt@redhat.com>
+ 2014-06-23 11:24:05 -0700
+ Commit: 853a2b9, github.com/apache/spark/pull/1181
+
+ Fixed small running on YARN docs typo
+ Vlad <frolvlad@gmail.com>
+ 2014-06-23 10:55:49 -0500
+ Commit: b88238f, github.com/apache/spark/pull/1158
+
+ [SPARK-1395] Fix "local:" URI support in Yarn mode (again).
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-06-23 08:51:11 -0500
+ Commit: e380767, github.com/apache/spark/pull/560
+
+ SPARK-2166 - Listing of instances to be terminated before the prompt
+ Jean-Martin Archer <jeanmartin.archer@pulseenergy.com>
+ 2014-06-22 20:52:02 -0700
+ Commit: 9cb64b2, github.com/apache/spark/pull/270
+
+ SPARK-2241: quote command line args in ec2 script
+ Ori Kremer <ori.kremer@gmail.com>
+ 2014-06-22 20:21:23 -0700
+ Commit: 9fc373e, github.com/apache/spark/pull/1169
+
+ SPARK-2229: FileAppender throws an IllegalArgumentException in jdk6
+ witgo <witgo@qq.com>
+ 2014-06-22 18:25:16 -0700
+ Commit: 409d24e, github.com/apache/spark/pull/1174
+
+ SPARK-1316. Remove use of Commons IO
+ Sean Owen <sowen@cloudera.com>
+ 2014-06-22 11:47:49 -0700
+ Commit: 9fe28c3, github.com/apache/spark/pull/1173
+
+ SPARK-2034. KafkaInputDStream doesn't close resources and may prevent JVM shutdown
+ Sean Owen <sowen@cloudera.com>
+ 2014-06-22 01:12:15 -0700
+ Commit: 476581e, github.com/apache/spark/pull/980
+
+ SPARK-2231: dev/run-tests should include YARN and use a recent Hadoop version
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-22 00:55:27 -0700
+ Commit: 58b32f3, github.com/apache/spark/pull/1175
+
+ SPARK-1996. Remove use of special Maven repo for Akka
+ Sean Owen <sowen@cloudera.com>
+ 2014-06-21 23:29:57 -0700
+ Commit: 1db9cbc, github.com/apache/spark/pull/1170
+
+ HOTFIX: Add excludes for new MIMA files
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-21 15:20:15 -0700
+ Commit: 3e0b078
+
+ HOTFIX: Fix missing MIMA ignore
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-21 13:02:49 -0700
+ Commit: 0a432d6
+
+ [SQL] Break hiveOperators.scala into multiple files.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-21 12:04:18 -0700
+ Commit: ec935ab, github.com/apache/spark/pull/1166
+
+ [SQL] Pass SQLContext instead of SparkContext into physical operators.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-20 22:49:48 -0700
+ Commit: ca5d8b5, github.com/apache/spark/pull/1164
+
+ Fix some tests.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-06-20 20:05:12 -0700
+ Commit: 648553d, github.com/apache/spark/pull/917
+
+ [SPARK-2061] Made splits deprecated in JavaRDDLike
+ Anant <anant.asty@gmail.com>
+ 2014-06-20 18:54:00 -0700
+ Commit: 010c460, github.com/apache/spark/pull/1062
+
+ HOTFIX: Fixing style error introduced by 08d0ac
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-20 18:44:54 -0700
+ Commit: a678642
+
+ [SPARK-1970] Update unit test in XORShiftRandomSuite to use ChiSquareTest from commons-math3
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-06-20 18:42:02 -0700
+ Commit: e99903b, github.com/apache/spark/pull/1073
+
+ SPARK-1902 Silence stacktrace from logs when doing port failover to port n+1
+ Andrew Ash <andrew@andrewash.com>
+ 2014-06-20 18:25:33 -0700
+ Commit: 08d0aca, github.com/apache/spark/pull/1019
+
+ [SQL] Use hive.SessionState, not the thread local SessionState
+ Aaron Davidson <aaron@databricks.com>
+ 2014-06-20 17:55:54 -0700
+ Commit: 2044784, github.com/apache/spark/pull/1148
+
+ Move ScriptTransformation into the appropriate place.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-20 17:16:56 -0700
+ Commit: d4c7572, github.com/apache/spark/pull/1162
+
+ Clean up CacheManager et al.
+ Andrew Or <andrewor14@gmail.com>
+ 2014-06-20 17:14:33 -0700
+ Commit: 01125a1, github.com/apache/spark/pull/1083
+
+ [SPARK-2225] Turn HAVING without GROUP BY into WHERE.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-20 15:38:02 -0700
+ Commit: 0ac71d1, github.com/apache/spark/pull/1161
+
+ SPARK-2180: support HAVING clauses in Hive queries
+ William Benton <willb@redhat.com>
+ 2014-06-20 13:41:38 -0700
+ Commit: 171ebb3, github.com/apache/spark/pull/1136
+
+ SPARK-1868: Users should be allowed to cogroup at least 4 RDDs
+ Allan Douglas R. de Oliveira <allandouglas@gmail.com>
+ 2014-06-20 11:03:03 -0700
+ Commit: 6a224c3, github.com/apache/spark/pull/813
+
+ [SPARK-2163] class LBFGS optimize with Double tolerance instead of Int
+ Gang Bai <me@baigang.net>
+ 2014-06-20 08:52:20 -0700
+ Commit: d484dde, github.com/apache/spark/pull/1104
+
+ [SPARK-2218] rename Equals to EqualTo in Spark SQL expressions.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-20 00:34:59 -0700
+ Commit: 2f6a835, github.com/apache/spark/pull/1146
+
+ [SPARK-2196] [SQL] Fix nullability of CaseWhen.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-06-20 00:12:52 -0700
+ Commit: 3249528, github.com/apache/spark/pull/1133
+
+ SPARK-2203: PySpark defaults to use same num reduce partitions as map side
+ Aaron Davidson <aaron@databricks.com>
+ 2014-06-20 00:06:57 -0700
+ Commit: f46e02f, github.com/apache/spark/pull/1138
+
+ [SPARK-2209][SQL] Cast shouldn't do null check twice.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-20 00:01:19 -0700
+ Commit: c55bbb4, github.com/apache/spark/pull/1143
+
+ [SPARK-2210] cast to boolean on boolean value gets turned into NOT((boolean_condition) = 0)
+ Reynold Xin <rxin@apache.org>
+ 2014-06-19 23:58:23 -0700
+ Commit: 6175640, github.com/apache/spark/pull/1144
+
+ SPARK-1293 [SQL] Parquet support for nested types
+ Andre Schumacher <andre.schumacher@iki.fi>, Michael Armbrust <michael@databricks.com>
+ 2014-06-19 23:47:45 -0700
+ Commit: f479cf3, github.com/apache/spark/pull/360
+
+ [SPARK-2177][SQL] describe table result contains only one column
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-06-19 23:41:38 -0700
+ Commit: f397e92, github.com/apache/spark/pull/1118
+
+ [SQL] Improve Speed of InsertIntoHiveTable
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-19 23:39:03 -0700
+ Commit: d3b7671, github.com/apache/spark/pull/1130
+
+ More minor scaladoc cleanup for Spark SQL.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-19 22:34:21 -0700
+ Commit: 278ec8a, github.com/apache/spark/pull/1142
+
+ HOTFIX: SPARK-2208 local metrics tests can fail on fast machines
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-19 21:06:28 -0700
+ Commit: e551479, github.com/apache/spark/pull/1141
+
+ A few minor Spark SQL Scaladoc fixes.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-19 18:24:05 -0700
+ Commit: 5464e79, github.com/apache/spark/pull/1139
+
+ [SPARK-2151] Recognize memory format for spark-submit
+ nravi <nravi@c1704.halxg.cloudera.com>
+ 2014-06-19 17:11:06 -0700
+ Commit: f14b00a, github.com/apache/spark/pull/1095
+
+ [SPARK-2191][SQL] Make sure InsertIntoHiveTable doesn't execute more than once.
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-19 14:14:03 -0700
+ Commit: 777c595, github.com/apache/spark/pull/1129
+
+ [SPARK-2051]In yarn.ClientBase spark.yarn.dist.* do not work
+ witgo <witgo@qq.com>
+ 2014-06-19 12:11:26 -0500
+ Commit: bce0897, github.com/apache/spark/pull/969
+
+ Minor fix
+ WangTao <barneystinson@aliyun.com>
+ 2014-06-18 23:24:57 -0700
+ Commit: 67fca18, github.com/apache/spark/pull/1105
+
+ [SPARK-2187] Explain should not run the optimizer twice.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-18 22:44:12 -0700
+ Commit: 640c294, github.com/apache/spark/pull/1123
+
+ Squishing a typo bug before it causes real harm
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-06-18 22:19:06 -0700
+ Commit: 566f70f, github.com/apache/spark/pull/1125
+
+ [SPARK-2184][SQL] AddExchange isn't idempotent
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-18 17:52:42 -0700
+ Commit: 5ff75c7, github.com/apache/spark/pull/1122
+
+ Remove unicode operator from RDD.scala
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-06-18 15:01:29 -0700
+ Commit: 45a95f8, github.com/apache/spark/pull/1119
+
+ SPARK-2158 Clean up core/stdout file from FileAppenderSuite
+ Mark Hamstra <markhamstra@gmail.com>
+ 2014-06-18 14:56:41 -0700
+ Commit: 4cbeea8, github.com/apache/spark/pull/1100
+
+ [SPARK-1466] Raise exception if pyspark Gateway process doesn't start.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-06-18 13:16:26 -0700
+ Commit: 3870248, github.com/apache/spark/pull/383
+
+ Updated the comment for SPARK-2162.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-18 12:48:58 -0700
+ Commit: dd96fcd, github.com/apache/spark/pull/1117
+
+ [SPARK-2162] Double check in doGetLocal to avoid read on removed block.
+ Raymond Liu <raymond.liu@intel.com>
+ 2014-06-18 10:57:45 -0700
+ Commit: 5ad5e34, github.com/apache/spark/pull/1103
+
+ [SPARK-2176][SQL] Extra unnecessary exchange operator in the result of an explain command
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-06-18 10:51:32 -0700
+ Commit: 587d320, github.com/apache/spark/pull/1116
+
+ [STREAMING] SPARK-2009 Key not found exception when slow receiver starts
+ Vadim Chekan <kot.begemot@gmail.com>
+ 2014-06-17 22:03:50 -0700
+ Commit: 889f7b7, github.com/apache/spark/pull/961
+
+ Revert "SPARK-2038: rename "conf" parameters in the saveAsHadoop functions"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-17 19:34:17 -0700
+ Commit: 9e4b4bd
+
+ [SPARK-2060][SQL] Querying JSON Datasets with SQL and DSL in Spark SQL
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-06-17 19:14:59 -0700
+ Commit: d2f4f30, github.com/apache/spark/pull/999
+
+ HOTFIX: bug caused by #941
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-17 15:09:24 -0700
+ Commit: b2ebf42, github.com/apache/spark/pull/1108
+
+ [SPARK-2147 / 2161] Show removed executors on the UI
+ Andrew Or <andrewor14@gmail.com>
+ 2014-06-17 12:25:55 -0700
+ Commit: a14807e, github.com/apache/spark/pull/1102
+
+ SPARK-2038: rename "conf" parameters in the saveAsHadoop functions
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-06-17 12:17:48 -0700
+ Commit: 443f5e1, github.com/apache/spark/pull/1087
+
+ SPARK-2146. Fix takeOrdered doc
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-06-17 12:03:22 -0700
+ Commit: 2794990, github.com/apache/spark/pull/1086
+
+ SPARK-1063 Add .sortBy(f) method on RDD
+ Andrew Ash <andrew@andrewash.com>
+ 2014-06-17 11:47:48 -0700
+ Commit: b92d16b, github.com/apache/spark/pull/369
+
+ [SPARK-2053][SQL] Add Catalyst expressions for CASE WHEN.
+ Zongheng Yang <zongheng.y@gmail.com>
+ 2014-06-17 13:30:17 +0200
+ Commit: e243c5f, github.com/apache/spark/pull/1055
+
+ [SPARK-2164][SQL] Allow Hive UDF on columns of type struct
+ Xi Liu <xil@conviva.com>
+ 2014-06-17 13:14:40 +0200
+ Commit: f5a4049, github.com/apache/spark/pull/796
+
+ [SPARK-2144] ExecutorsPage reports incorrect # of RDD blocks
+ Andrew Or <andrewor14@gmail.com>
+ 2014-06-17 01:28:22 -0700
+ Commit: 09deb3e, github.com/apache/spark/pull/1080
+
+ SPARK-2035: Store call stack for stages, display it on the UI.
+ Daniel Darabos <darabos.daniel@gmail.com>, Patrick Wendell <pwendell@gmail.com>
+ 2014-06-17 00:08:05 -0700
+ Commit: 23a12ce, github.com/apache/spark/pull/981
+
+ SPARK-1990: added compatibility for python 2.6 for ssh_read command
+ Anant <anant.asty@gmail.com>
+ 2014-06-16 23:42:27 -0700
+ Commit: 8cd04c3, github.com/apache/spark/pull/941
+
+ [SPARK-2130] End-user friendly String repr for StorageLevel in Python
+ Kan Zhang <kzhang@apache.org>
+ 2014-06-16 23:31:31 -0700
+ Commit: d81c08b, github.com/apache/spark/pull/1096
+
+ MLlib documentation fix
+ Anatoli Fomenko <fa@apache.org>
+ 2014-06-16 23:10:36 -0700
+ Commit: 7afa912, github.com/apache/spark/pull/1098
+
+ Minor fix: made "EXPLAIN" output to play well with JDBC output format
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-16 16:42:17 -0700
+ Commit: 237b96b, github.com/apache/spark/pull/1097
+
+ [SQL][SPARK-2094] Follow up of PR #1071 for Java API
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-16 21:30:29 +0200
+ Commit: 273afcb, github.com/apache/spark/pull/1085
+
+ [SPARK-1930] The Container is running beyond physical memory limits, so as to be killed
+ witgo <witgo@qq.com>
+ 2014-06-16 14:27:31 -0500
+ Commit: cdf2b04, github.com/apache/spark/pull/894
+
+ [SPARK-2010] Support for nested data in PySpark SQL
+ Kan Zhang <kzhang@apache.org>
+ 2014-06-16 11:11:29 -0700
+ Commit: 4fdb491, github.com/apache/spark/pull/1041
+
+ SPARK-2039: apply output dir existence checking for all output formats
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-06-15 23:47:58 -0700
+ Commit: 716c88a, github.com/apache/spark/pull/1088
+
+ Updating docs to include missing information about reducers and clarify ...
+ Ali Ghodsi <alig@cs.berkeley.edu>
+ 2014-06-15 23:44:30 -0700
+ Commit: 119b06a, github.com/apache/spark/pull/1089
+
+ SPARK-2148 Add link to requirements for custom equals() and hashcode() methods
+ Andrew Ash <andrew@andrewash.com>
+ 2014-06-15 23:32:55 -0700
+ Commit: 9672ee0, github.com/apache/spark/pull/1092
+
+ SPARK-1999: StorageLevel in storage tab and RDD Storage Info never changes
+ CrazyJvm <crazyjvm@gmail.com>
+ 2014-06-15 23:23:26 -0700
+ Commit: a63aa1a, github.com/apache/spark/pull/968
+
+ [SPARK-937] adding EXITED executor state and not relaunching cleanly exited executors
+ Kan Zhang <kzhang@apache.org>
+ 2014-06-15 14:55:34 -0700
+ Commit: ca5d9d4, github.com/apache/spark/pull/306
+
+ [SQL] Support transforming TreeNodes with Option children.
+ Michael Armbrust <michael@databricks.com>, Zongheng Yang <zongheng.y@gmail.com>
+ 2014-06-15 11:28:34 +0200
+ Commit: 269fc62, github.com/apache/spark/pull/1074
+
+ [SPARK-1837] NumericRange should be partitioned in the same way as other...
+ Kan Zhang <kzhang@apache.org>
+ 2014-06-14 14:31:28 -0700
+ Commit: 7dd9fc6, github.com/apache/spark/pull/776
+
+ [SPARK-2013] Documentation for saveAsPickleFile and pickleFile in Python
+ Kan Zhang <kzhang@apache.org>
+ 2014-06-14 13:22:30 -0700
+ Commit: b52603b, github.com/apache/spark/pull/983
+
+ [SPARK-2079] Support batching when serializing SchemaRDD to Python
+ Kan Zhang <kzhang@apache.org>
+ 2014-06-14 13:17:22 -0700
+ Commit: 2550533, github.com/apache/spark/pull/1023
+
+ [Spark-2137][SQL] Timestamp UDFs broken
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-06-13 23:28:57 -0700
+ Commit: 8919685, github.com/apache/spark/pull/1081
+
+ Small correction in Streaming Programming Guide doc
+ akkomar <ak.komar@gmail.com>
+ 2014-06-13 15:37:26 -0700
+ Commit: edb1f0e, github.com/apache/spark/pull/1079
+
+ [SPARK-2094][SQL] "Exactly once" semantics for DDL and command statements
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-13 12:59:48 -0700
+ Commit: ac96d96, github.com/apache/spark/pull/1071
+
+ [SPARK-1964][SQL] Add timestamp to HiveMetastoreTypes.toMetastoreType
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-13 12:55:15 -0700
+ Commit: 1c2fd01, github.com/apache/spark/pull/1061
+
+ Workaround in Spark for ConcurrentModification issue (JIRA Hadoop-10456, Spark-1097)
+ nravi <nravi@c1704.halxg.cloudera.com>
+ 2014-06-13 10:52:21 -0700
+ Commit: 70c8116, github.com/apache/spark/pull/1000
+
+ [HOTFIX] add math3 version to pom
+ Xiangrui Meng <meng@databricks.com>
+ 2014-06-13 02:59:38 -0700
+ Commit: b3736e3, github.com/apache/spark/pull/1075
+
+ [SPARK-2135][SQL] Use planner for in-memory scans
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-12 23:09:41 -0700
+ Commit: 13f8cfd, github.com/apache/spark/pull/1072
+
+ [SPARK-1516]Throw exception in yarn client instead of run system.exit directly.
+ John Zhao <jzhao@alpinenow.com>
+ 2014-06-12 21:39:00 -0700
+ Commit: f95ac68, github.com/apache/spark/pull/490
+
+ [Minor] Fix style, formatting and naming in BlockManager etc.
+ Andrew Or <andrewor14@gmail.com>
+ 2014-06-12 20:40:58 -0700
+ Commit: 44daec5, github.com/apache/spark/pull/1058
+
+ SPARK-1939 Refactor takeSample method in RDD to use ScaSRS
+ Doris Xin <doris.s.xin@gmail.com>, dorx <doris.s.xin@gmail.com>, Xiangrui Meng <meng@databricks.com>
+ 2014-06-12 19:44:27 -0700
+ Commit: 1de1d70, github.com/apache/spark/pull/916
+
+ document laziness of parallelize
+ Ariel Rabkin <asrabkin@cs.princeton.edu>
+ 2014-06-12 17:51:33 -0700
+ Commit: 0154587, github.com/apache/spark/pull/1070
+
+ SPARK-2085: [MLlib] Apply user-specific regularization instead of uniform regularization in ALS
+ Shuo Xiang <sxiang@twitter.com>
+ 2014-06-12 17:37:06 -0700
+ Commit: a6e0afd, github.com/apache/spark/pull/1026
+
+ SPARK-1843: Replace assemble-deps with env variable.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-12 15:43:32 -0700
+ Commit: 1c04652, github.com/apache/spark/pull/877
+
+ [SPARK-2080] Yarn: report HS URL in client mode, correct user in cluster mode.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-06-12 16:19:36 -0500
+ Commit: ecde5b8, github.com/apache/spark/pull/1002
+
+ [SPARK-2088] fix NPE in toString
+ Doris Xin <doris.s.xin@gmail.com>
+ 2014-06-12 12:53:07 -0700
+ Commit: 83c226d, github.com/apache/spark/pull/1028
+
+ SPARK-554. Add aggregateByKey.
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-06-12 08:14:25 -0700
+ Commit: ce92a9c, github.com/apache/spark/pull/705
+
+ fixed typo in docstring for min()
+ Jeff Thompson <jeffreykeatingthompson@gmail.com>
+ 2014-06-12 08:10:51 -0700
+ Commit: 43d53d5, github.com/apache/spark/pull/1065
+
+ Cleanup on Connection and ConnectionManager
+ Henry Saputra <henry.saputra@gmail.com>
+ 2014-06-11 23:17:51 -0700
+ Commit: 4d8ae70, github.com/apache/spark/pull/1060
+
+ 'killFuture' is never used
+ Yadong <qiyadong2010@gmail.com>
+ 2014-06-11 20:58:39 -0700
+ Commit: e056320, github.com/apache/spark/pull/1052
+
+ [SPARK-2044] Pluggable interface for shuffles
+ Matei Zaharia <matei@databricks.com>
+ 2014-06-11 20:45:29 -0700
+ Commit: 508fd37, github.com/apache/spark/pull/1009
+
+ [SPARK-1672][MLLIB] Separate user and product partitioning in ALS
+ Tor Myklebust <tmyklebu@gmail.com>, Xiangrui Meng <meng@databricks.com>
+ 2014-06-11 18:16:33 -0700
+ Commit: d920335, github.com/apache/spark/pull/1014
+
+ [SPARK-2052] [SQL] Add optimization for CaseConversionExpression's.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-06-11 17:58:35 -0700
+ Commit: 9a2448d, github.com/apache/spark/pull/990
+
+ HOTFIX: Forgot to remove false change in previous commit
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-11 15:55:41 -0700
+ Commit: d45e0c6
+
+ HOTFIX: PySpark tests should be order insensitive.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-11 15:54:41 -0700
+ Commit: 14e6dc9, github.com/apache/spark/pull/1054
+
+ HOTFIX: A few PySpark tests were not actually run
+ Andrew Or <andrewor14@gmail.com>
+ 2014-06-11 12:11:46 -0700
+ Commit: fe78b8b, github.com/apache/spark/pull/1053
+
+ [SQL] Code Cleanup: Left Semi Hash Join
+ Daoyuan <daoyuan.wang@intel.com>
+ 2014-06-11 12:08:28 -0700
+ Commit: ce6deb1, github.com/apache/spark/pull/1049
+
+ [SPARK-2042] Prevent unnecessary shuffle triggered by take()
+ Sameer Agarwal <sameer@databricks.com>
+ 2014-06-11 12:01:04 -0700
+ Commit: 4107cce, github.com/apache/spark/pull/1048
+
+ SPARK-2113: awaitTermination() after stop() will hang in Spark Streaming
+ Lars Albertsson <lalle@spotify.com>
+ 2014-06-11 10:54:42 -0700
+ Commit: 4d5c12a, github.com/apache/spark/pull/1001
+
+ [SPARK-2108] Mark SparkContext methods that return block information as developer API's
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-06-11 10:49:34 -0700
+ Commit: e508f59, github.com/apache/spark/pull/1047
+
+ [SPARK-2069] MIMA false positives
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-06-11 10:47:06 -0700
+ Commit: 5b754b4, github.com/apache/spark/pull/1021
+
+ SPARK-1639. Tidy up some Spark on YARN code
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-06-11 07:57:28 -0500
+ Commit: 2a4225d, github.com/apache/spark/pull/561
+
+ SPARK-2107: FilterPushdownSuite doesn't need Junit jar.
+ Qiuzhuang.Lian <Qiuzhuang.Lian@gmail.com>
+ 2014-06-11 00:36:06 -0700
+ Commit: 6e11930, github.com/apache/spark/pull/1046
+
+ [SPARK-2091][MLLIB] use numpy.dot instead of ndarray.dot
+ Xiangrui Meng <meng@databricks.com>
+ 2014-06-11 00:22:40 -0700
+ Commit: 0f1dc3a, github.com/apache/spark/pull/1035
+
+ [SPARK-1968][SQL] SQL/HiveQL command for caching/uncaching tables
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-11 00:06:50 -0700
+ Commit: 0266a0c, github.com/apache/spark/pull/1038
+
+ [SPARK-2093] [SQL] NullPropagation should use exact type value.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-06-10 23:13:48 -0700
+ Commit: 0402bd7, github.com/apache/spark/pull/1034
+
+ HOTFIX: clear() configs in SQLConf-related unit tests.
+ Zongheng Yang <zongheng.y@gmail.com>
+ 2014-06-10 21:59:01 -0700
+ Commit: 601032f, github.com/apache/spark/pull/1040
+
+ [SPARK-2065] give launched instances names
+ Nicholas Chammas <nicholas.chammas@gmail.com>, nchammas <nicholas.chammas@gmail.com>
+ 2014-06-10 21:49:08 -0700
+ Commit: a2052a4, github.com/apache/spark/pull/1043
+
+ Resolve scalatest warnings during build
+ witgo <witgo@qq.com>
+ 2014-06-10 20:24:05 -0700
+ Commit: c48b622, github.com/apache/spark/pull/1032
+
+ [SPARK-1940] Enabling rolling of executor logs, and automatic cleanup of old executor logs
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-06-10 20:22:02 -0700
+ Commit: 4823bf4, github.com/apache/spark/pull/895
+
+ [SPARK-1998] SparkFlumeEvent with body bigger than 1020 bytes are not re...
+ joyyoj <sunshch@gmail.com>
+ 2014-06-10 17:26:17 -0700
+ Commit: 2966044, github.com/apache/spark/pull/951
+
+ [SQL] Add average overflow test case from #978
+ egraldlo <egraldlo@gmail.com>, Michael Armbrust <michael@databricks.com>
+ 2014-06-10 14:07:55 -0700
+ Commit: 1abbde0, github.com/apache/spark/pull/1033
+
+ HOTFIX: Increase time limit for Bagel test
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-06-10 13:15:06 -0700
+ Commit: 55a0e87, github.com/apache/spark/pull/1037
+
+ HOTFIX: Fix Python tests on Jenkins.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-10 13:13:17 -0700
+ Commit: fb499be, github.com/apache/spark/pull/1036
+
+ [SPARK-2076][SQL] Pushdown the join filter & predication for outer join
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-06-10 12:59:52 -0700
+ Commit: db0c038, github.com/apache/spark/pull/1015
+
+ [SPARK-1978] In some cases, spark-yarn does not automatically restart the failed container
+ witgo <witgo@qq.com>
+ 2014-06-10 10:34:57 -0500
+ Commit: 884ca71, github.com/apache/spark/pull/921
+
+ Moved hiveOperators.scala to the right package folder
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-10 01:14:44 -0700
+ Commit: a9a461c, github.com/apache/spark/pull/1029
+
+ [SPARK-1508][SQL] Add SQLConf to SQLContext.
+ Zongheng Yang <zongheng.y@gmail.com>
+ 2014-06-10 00:49:09 -0700
+ Commit: 08ed9ad, github.com/apache/spark/pull/956
+
+ SPARK-1416: PySpark support for SequenceFile and Hadoop InputFormats
+ Nick Pentreath <nick.pentreath@gmail.com>
+ 2014-06-09 22:21:03 -0700
+ Commit: f971d6c, github.com/apache/spark/pull/455
+
+ Make sure that empty string is filtered out when we get the secondary jars from conf
+ DB Tsai <dbtsai@dbtsai.com>
+ 2014-06-09 22:18:50 -0700
+ Commit: 6f2db8c, github.com/apache/spark/pull/1027
+
+ [SPARK-1704][SQL] Fully support EXPLAIN commands as SchemaRDD.
+ Zongheng Yang <zongheng.y@gmail.com>
+ 2014-06-09 16:47:44 -0700
+ Commit: a9ec033, github.com/apache/spark/pull/1003
+
+ [SQL] Simple framework for debugging query execution
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-09 14:24:19 -0700
+ Commit: c6e041d, github.com/apache/spark/pull/1005
+
+ [SPARK-1522] : YARN ClientBase throws a NPE if there is no YARN Application CP
+ Bernardo Gomez Palacio <bernardo.gomezpalacio@gmail.com>
+ 2014-06-09 16:14:54 -0500
+ Commit: e273447, github.com/apache/spark/pull/433
+
+ Added a TaskSetManager unit test.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-06-09 13:13:53 -0700
+ Commit: 6cf335d, github.com/apache/spark/pull/1024
+
+ [SPARK-1495][SQL]add support for left semi join
+ Daoyuan <daoyuan.wang@intel.com>, Michael Armbrust <michael@databricks.com>, Daoyuan Wang <daoyuan.wang@intel.com>
+ 2014-06-09 11:31:36 -0700
+ Commit: 0cf6002, github.com/apache/spark/pull/837
+
+ SPARK-1944 Document --verbose in spark-shell -h
+ Andrew Ash <andrew@andrewash.com>
+ 2014-06-09 10:21:21 -0700
+ Commit: 35630c8, github.com/apache/spark/pull/1020
+
+ [SPARK-1308] Add getNumPartitions to pyspark RDD
+ Syed Hashmi <shashmi@cloudera.com>
+ 2014-06-09 00:08:40 -0700
+ Commit: 6113ac1, github.com/apache/spark/pull/995
+
+ Grammar: read -> reads
+ Andrew Ash <andrew@andrewash.com>
+ 2014-06-08 23:20:10 -0700
+ Commit: 32ee9f0, github.com/apache/spark/pull/1016
+
+ [SPARK-2067] use relative path for Spark logo in UI
+ Neville Li <neville@spotify.com>
+ 2014-06-08 23:18:27 -0700
+ Commit: 15ddbef, github.com/apache/spark/pull/1006
+
+ SPARK-1628 follow up: Improve RangePartitioner's documentation.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-08 18:39:57 -0700
+ Commit: 219dc00, github.com/apache/spark/pull/1012
+
+ Update run-example
+ maji2014 <maji3@asiainfo-linkage.com>
+ 2014-06-08 15:14:27 -0700
+ Commit: e9261d0, github.com/apache/spark/pull/1011
+
+ SPARK-1628: Add missing hashCode methods in Partitioner subclasses
+ zsxwing <zsxwing@gmail.com>
+ 2014-06-08 14:18:52 -0700
+ Commit: a71c6d1, github.com/apache/spark/pull/549
+
+ SPARK-1898: In deploy.yarn.Client, use YarnClient not YarnClientImpl
+ Colin Patrick McCabe <cmccabe@cloudera.com>
+ 2014-06-08 12:27:34 -0700
+ Commit: ee96e94, github.com/apache/spark/pull/850
+
+ SPARK-2026: Maven Hadoop Profiles Should Set The Hadoop Version
+ Bernardo Gomez Palacio <bernardo.gomezpalacio@gmail.com>
+ 2014-06-08 01:24:52 -0700
+ Commit: a338834, github.com/apache/spark/pull/998
+
+ SPARK-2056 Set RDD name to input path
+ Neville Li <neville@spotify.com>
+ 2014-06-07 16:22:26 -0700
+ Commit: 7b877b2, github.com/apache/spark/pull/992
+
+ HOTFIX: Support empty body in merge script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-07 16:16:37 -0700
+ Commit: 3ace10d, github.com/apache/spark/pull/1007
+
+ [SPARK-1994][SQL] Weird data corruption bug when running Spark SQL on data in HDFS
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-07 14:20:33 -0700
+ Commit: a6c72ab, github.com/apache/spark/pull/1004
+
+ [SPARK-1841]: update scalatest to version 2.1.5
+ witgo <witgo@qq.com>
+ 2014-06-06 11:45:21 -0700
+ Commit: 41c4a33, github.com/apache/spark/pull/713
+
+ [SPARK-2050 - 2][SQL] DIV and BETWEEN should not be case sensitive.
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-06 11:31:37 -0700
+ Commit: 8d21056, github.com/apache/spark/pull/994
+
+ [SPARK-1552] Fix type comparison bug in {map,outerJoin}Vertices
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-06-05 23:33:12 -0700
+ Commit: 8d85359, github.com/apache/spark/pull/967
+
+ [SPARK-2050][SQL] LIKE, RLIKE and IN in HQL should not be case sensitive.
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-05 23:20:59 -0700
+ Commit: 41db44c, github.com/apache/spark/pull/989
+
+ SPARK-2043: ExternalAppendOnlyMap doesn't always find matching keys
+ Matei Zaharia <matei@databricks.com>
+ 2014-06-05 23:01:48 -0700
+ Commit: b45c13e, github.com/apache/spark/pull/986
+
+ [SPARK-2025] Unpersist edges of previous graph in Pregel
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-06-05 17:45:38 -0700
+ Commit: 9bad0b7, github.com/apache/spark/pull/972
+
+ Use pluggable clock in DAGScheduler #SPARK-2031
+ CrazyJvm <crazyjvm@gmail.com>
+ 2014-06-05 17:44:46 -0700
+ Commit: 3d3f8c8, github.com/apache/spark/pull/976
+
+ [SPARK-2041][SQL] Correctly analyze queries where columnName == tableName.
+ Michael Armbrust <michael@databricks.com>
+ 2014-06-05 17:42:08 -0700
+ Commit: c7a183b, github.com/apache/spark/pull/985
+
+ Remove compile-scoped junit dependency.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-06-05 13:13:33 -0700
+ Commit: 668cb1d, github.com/apache/spark/pull/794
+
+ sbt 0.13.X should be using sbt-assembly 0.11.X
+ Kalpit Shah <shahkalpit84@gmail.com>
+ 2014-06-05 13:07:26 -0700
+ Commit: 5473aa7, github.com/apache/spark/pull/555
+
+ HOTFIX: Remove generated-mima-excludes file after running MIMA.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-05 13:06:46 -0700
+ Commit: f6143f1, github.com/apache/spark/pull/971
+
+ [SPARK-2036] [SQL] CaseConversionExpression should check if the evaluated value is null.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-06-05 12:00:31 -0700
+ Commit: e4c11ee, github.com/apache/spark/pull/982
+
+ SPARK-1677: allow user to disable output dir existence checking
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-06-05 11:39:35 -0700
+ Commit: 89cdbb0, github.com/apache/spark/pull/947
+
+ [SPARK-2029] Bump pom.xml version number of master branch to 1.1.0-SNAPSHOT.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-06-05 11:27:33 -0700
+ Commit: 7c16029, github.com/apache/spark/pull/974
+
+ Fix issue in ReplSuite with hadoop-provided profile.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-06-04 22:56:49 -0700
+ Commit: b77c19b, github.com/apache/spark/pull/781
+
+ Minor: Fix documentation error from apache/spark#946
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-06-04 16:45:53 -0700
+ Commit: abea2d4, github.com/apache/spark/pull/970
+
+ SPARK-1790: Update EC2 scripts to support r3 instance types
+ Varakhedi Sujeet <svarakhedi@gopivotal.com>
+ 2014-06-04 16:01:56 -0700
+ Commit: 11ded3f, github.com/apache/spark/pull/960
+
+ SPARK-1518: FileLogger: Fix compile against Hadoop trunk
+ Colin McCabe <cmccabe@cloudera.com>
+ 2014-06-04 15:56:29 -0700
+ Commit: 1765c8d, github.com/apache/spark/pull/898
+
+ [SPARK-1752][MLLIB] Standardize text format for vectors and labeled points
+ Xiangrui Meng <meng@databricks.com>
+ 2014-06-04 12:56:56 -0700
+ Commit: 189df16, github.com/apache/spark/pull/685
+
+ SPARK-1973. Add randomSplit to JavaRDD (with tests, and tidy Java tests)
+ Sean Owen <sowen@cloudera.com>, Xiangrui Meng <meng@databricks.com>
+ 2014-06-04 11:27:08 -0700
+ Commit: d341b17, github.com/apache/spark/pull/919
+
+ [MLLIB] set RDD names in ALS
+ Neville Li <neville@spotify.com>
+ 2014-06-04 01:51:34 -0700
+ Commit: b8d2580, github.com/apache/spark/pull/966
+
+ [SPARK-1817] RDD.zip() should verify partition sizes for each partition
+ Kan Zhang <kzhang@apache.org>
+ 2014-06-03 22:47:18 -0700
+ Commit: c402a4a, github.com/apache/spark/pull/944
+
+ SPARK-1806 (addendum) Use non-deprecated methods in Mesos 0.18
+ Sean Owen <sowen@cloudera.com>
+ 2014-06-03 22:37:20 -0700
+ Commit: 4ca0625, github.com/apache/spark/pull/920
+
+ Update spark-ec2 scripts for 1.0.0 on master
+ Aaron Davidson <aaron@databricks.com>
+ 2014-06-03 22:33:04 -0700
+ Commit: ab7c62d, github.com/apache/spark/pull/938
+
+ Enable repartitioning of graph over different number of partitions
+ Joseph E. Gonzalez <joseph.e.gonzalez@gmail.com>
+ 2014-06-03 20:49:14 -0700
+ Commit: 5284ca7, github.com/apache/spark/pull/719
+
+ use env default python in merge_spark_pr.py
+ Xiangrui Meng <meng@databricks.com>
+ 2014-06-03 18:53:13 -0700
+ Commit: e8d93ee, github.com/apache/spark/pull/965
+
+ SPARK-1941: Update streamlib to 2.7.0 and use HyperLogLogPlus instead of HyperLogLog.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-03 18:37:40 -0700
+ Commit: 1faef14, github.com/apache/spark/pull/897
+
+ [SPARK-1161] Add saveAsPickleFile and SparkContext.pickleFile in Python
+ Kan Zhang <kzhang@apache.org>
+ 2014-06-03 18:18:25 -0700
+ Commit: 21e40ed, github.com/apache/spark/pull/755
+
+ Fixed a typo
+ DB Tsai <dbtsai@dbtsai.com>
+ 2014-06-03 18:10:58 -0700
+ Commit: f4dd665, github.com/apache/spark/pull/959
+
+ [SPARK-1991] Support custom storage levels for vertices and edges
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-06-03 14:54:26 -0700
+ Commit: b1feb60, github.com/apache/spark/pull/946
+
+ Synthetic GraphX Benchmark
+ Joseph E. Gonzalez <joseph.e.gonzalez@gmail.com>, Ankur Dave <ankurdave@gmail.com>
+ 2014-06-03 14:14:48 -0700
+ Commit: 894ecde, github.com/apache/spark/pull/720
+
+ fix java.lang.ClassCastException
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-06-03 13:39:47 -0700
+ Commit: aa41a52, github.com/apache/spark/pull/949
+
+ [SPARK-1468] Modify the partition function used by partitionBy.
+ Erik Selin <erik.selin@jadedpixel.com>
+ 2014-06-03 13:31:16 -0700
+ Commit: 8edc9d0, github.com/apache/spark/pull/371
+
+ Add support for Pivotal HD in the Maven build: SPARK-1992
+ tzolov <christian.tzolov@gmail.com>
+ 2014-06-03 13:26:29 -0700
+ Commit: b1f2853, github.com/apache/spark/pull/942
+
+ [SPARK-1912] fix compress memory issue during reduce
+ Wenchen Fan(Cloud) <cloud0fan@gmail.com>
+ 2014-06-03 13:18:20 -0700
+ Commit: 45e9bc8, github.com/apache/spark/pull/860
+
+ SPARK-2001 : Remove docs/spark-debugger.md from master
+ Henry Saputra <henry.saputra@gmail.com>
+ 2014-06-03 13:03:51 -0700
+ Commit: 6c044ed, github.com/apache/spark/pull/953
+
+ [SPARK-1942] Stop clearing spark.driver.port in unit tests
+ Syed Hashmi <shashmi@cloudera.com>, CodingCat <zhunansjtu@gmail.com>
+ 2014-06-03 12:04:47 -0700
+ Commit: 7782a30, github.com/apache/spark/pull/943
+
+ Avoid dynamic dispatching when unwrapping Hive data.
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-02 19:20:23 -0700
+ Commit: 862283e, github.com/apache/spark/pull/935
+
+ [SPARK-1995][SQL] system function upper and lower can be supported
+ egraldlo <egraldlo@gmail.com>
+ 2014-06-02 18:02:57 -0700
+ Commit: ec8be27, github.com/apache/spark/pull/936
+
+ [SPARK-1958] Calling .collect() on a SchemaRDD should call executeCollect() on the underlying query plan.
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-06-02 12:09:43 -0700
+ Commit: d000ca9, github.com/apache/spark/pull/939
+
+ [SPARK-1553] Alternating nonnegative least-squares
+ Tor Myklebust <tmyklebu@gmail.com>
+ 2014-06-02 11:48:09 -0700
+ Commit: 9a5d482, github.com/apache/spark/pull/460
+
+ Add landmark-based Shortest Path algorithm to graphx.lib
+ Ankur Dave <ankurdave@gmail.com>, Andres Perez <andres@tresata.com>
+ 2014-06-02 00:00:24 -0700
+ Commit: 9535f40, github.com/apache/spark/pull/933
+
+ Better explanation for how to use MIMA excludes.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-06-01 17:27:05 -0700
+ Commit: d17d221, github.com/apache/spark/pull/937
+
+ Made spark_ec2.py PEP8 compliant.
+ Reynold Xin <rxin@apache.org>
+ 2014-06-01 15:39:04 -0700
+ Commit: eea3aab, github.com/apache/spark/pull/891
+
+ updated java code blocks in spark SQL guide such that ctx will refer to ...
+ Yadid Ayzenberg <yadid@media.mit.edu>
+ 2014-05-31 19:44:13 -0700
+ Commit: 366c0c4, github.com/apache/spark/pull/932
+
+ SPARK-1917: fix PySpark import of scipy.special functions
+ Uri Laserson <laserson@cloudera.com>
+ 2014-05-31 14:59:09 -0700
+ Commit: 5e98967, github.com/apache/spark/pull/866
+
+ Improve maven plugin configuration
+ witgo <witgo@qq.com>
+ 2014-05-31 14:36:27 -0700
+ Commit: d8c005d, github.com/apache/spark/pull/786
+
+ SPARK-1839: PySpark RDD#take() shouldn't always read from driver
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-31 13:04:57 -0700
+ Commit: 9909efc, github.com/apache/spark/pull/922
+
+ Super minor: Close inputStream in SparkSubmitArguments
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-31 12:36:58 -0700
+ Commit: 7d52777, github.com/apache/spark/pull/914
+
+ [SQL] SPARK-1964 Add timestamp to hive metastore type parser.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-31 12:34:22 -0700
+ Commit: 1a0da0e, github.com/apache/spark/pull/913
+
+ Optionally include Hive as a dependency of the REPL.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-31 12:24:35 -0700
+ Commit: 7463cd2, github.com/apache/spark/pull/801
+
+ [SPARK-1947] [SQL] Child of SumDistinct or Average should be widened to prevent overflows the same as Sum.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-31 11:30:03 -0700
+ Commit: 3ce8149, github.com/apache/spark/pull/902
+
+ correct tiny comment error
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-05-31 00:06:49 -0700
+ Commit: 9ecc40d, github.com/apache/spark/pull/928
+
+ [SPARK-1959] String "NULL" shouldn't be interpreted as null value
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-05-30 22:13:11 -0700
+ Commit: cf98960, github.com/apache/spark/pull/909
+
+ SPARK-1976: fix the misleading part in streaming docs
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-05-30 22:06:08 -0700
+ Commit: 41bfdda, github.com/apache/spark/pull/924
+
+ updated link to mailing list
+ nchammas <nicholas.chammas@gmail.com>
+ 2014-05-30 22:04:57 -0700
+ Commit: 23ae366, github.com/apache/spark/pull/923
+
+ Typo: and -> an
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-30 22:02:04 -0700
+ Commit: 9c1f204, github.com/apache/spark/pull/927
+
+ [SPARK-1901] worker should make sure executor has exited before updating executor's info
+ Zhen Peng <zhenpeng01@baidu.com>
+ 2014-05-30 10:11:02 -0700
+ Commit: ff562b2, github.com/apache/spark/pull/854
+
+ [SPARK-1971] Update MIMA to compare against Spark 1.0.0
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-05-30 01:13:51 -0700
+ Commit: 79fa8fd, github.com/apache/spark/pull/910
+
+ [SPARK-1566] consolidate programming guide, and general doc updates
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-30 00:34:33 -0700
+ Commit: c8bf413, github.com/apache/spark/pull/896
+
+ [SPARK-1820] Make GenerateMimaIgnore @DeveloperApi annotation aware.
+ Prashant Sharma <prashant.s@imaginea.com>, nikhil7sh <nikhilsharmalnmiit@gmail.ccom>
+ 2014-05-29 23:20:20 -0700
+ Commit: eeee978, github.com/apache/spark/pull/904
+
+ initial version of LPA
+ Ankur Dave <ankurdave@gmail.com>, haroldsultan <haroldsultan@gmail.com>, Harold Sultan <haroldsultan@gmail.com>
+ 2014-05-29 15:39:25 -0700
+ Commit: b7e28fa, github.com/apache/spark/pull/905
+
+ [SPARK-1368][SQL] Optimized HiveTableScan
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-05-29 15:24:03 -0700
+ Commit: 8f7141f, github.com/apache/spark/pull/758
+
+ SPARK-1935: Explicitly add commons-codec 1.5 as a dependency.
+ Yin Huai <huai@cse.ohio-state.edu>
+ 2014-05-29 09:07:39 -0700
+ Commit: 60b89fe, github.com/apache/spark/pull/889
+
+ Added doctest and method description in context.py
+ Jyotiska NK <jyotiska123@gmail.com>
+ 2014-05-28 23:08:39 -0700
+ Commit: 9cff1dd, github.com/apache/spark/pull/187
+
+ [SPARK-1712]: TaskDescription instance is too big causes Spark to hang
+ witgo <witgo@qq.com>
+ 2014-05-28 15:57:05 -0700
+ Commit: 4dbb27b, github.com/apache/spark/pull/694
+
+ Spark 1916
+ David Lemieux <david.lemieux@radialpoint.com>
+ 2014-05-28 15:50:35 -0700
+ Commit: 4312cf0, github.com/apache/spark/pull/865
+
+ Organize configuration docs
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-28 15:49:54 -0700
+ Commit: 7801d44, github.com/apache/spark/pull/880
+
+ Fix doc about NetworkWordCount/JavaNetworkWordCount usage of spark streaming
+ jmu <jmujmu@gmail.com>
+ 2014-05-27 22:41:47 -0700
+ Commit: 82eadc3, github.com/apache/spark/pull/826
+
+ [SPARK-1938] [SQL] ApproxCountDistinctMergeFunction should return Int value.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-27 22:17:50 -0700
+ Commit: 9df8683, github.com/apache/spark/pull/893
+
+ [SQL] SPARK-1922
+ LY Lai <ly.lai@vpon.com>
+ 2014-05-27 16:08:38 -0700
+ Commit: 0682567, github.com/apache/spark/pull/873
+
+ [SPARK-1915] [SQL] AverageFunction should not count if the evaluated value is null.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-27 14:55:23 -0700
+ Commit: 3b0baba, github.com/apache/spark/pull/862
+
+ [SPARK-1926] [SQL] Nullability of Max/Min/First should be true.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-27 14:53:57 -0700
+ Commit: d1375a2, github.com/apache/spark/pull/881
+
+ bugfix worker DriverStateChanged state should match DriverState.FAILED
+ lianhuiwang <lianhuiwang09@gmail.com>
+ 2014-05-27 11:53:38 -0700
+ Commit: 95e4c9c, github.com/apache/spark/pull/864
+
+ SPARK-1932: Fix race conditions in onReceiveCallback and cachedPeers
+ zsxwing <zsxwing@gmail.com>
+ 2014-05-26 23:17:39 -0700
+ Commit: 549830b, github.com/apache/spark/pull/887
+
+ SPARK-1933: Throw a more meaningful exception when a directory is passed to addJar/addFile.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-26 22:05:23 -0700
+ Commit: 90e281b, github.com/apache/spark/pull/888
+
+ Updated dev Python scripts to make them PEP8 compliant.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-26 21:40:52 -0700
+ Commit: 9ed3719, github.com/apache/spark/pull/875
+
+ Fixed the error message for OutOfMemoryError in DAGScheduler.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-26 21:31:27 -0700
+ Commit: ef690e1
+
+ SPARK-1929 DAGScheduler suspended by local task OOM
+ Zhen Peng <zhenpeng01@baidu.com>
+ 2014-05-26 21:30:25 -0700
+ Commit: 8d271c9, github.com/apache/spark/pull/883
+
+ [SPARK-1931] Reconstruct routing tables in Graph.partitionBy
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-05-26 16:10:22 -0700
+ Commit: 56c771c, github.com/apache/spark/pull/885
+
+ SPARK-1925: Replace '&' with '&&'
+ zsxwing <zsxwing@gmail.com>
+ 2014-05-26 14:34:58 -0700
+ Commit: cb7fe50, github.com/apache/spark/pull/879
+
+ Fix scalastyle warnings in yarn alpha
+ witgo <witgo@qq.com>
+ 2014-05-26 13:16:35 -0700
+ Commit: bee6c4f, github.com/apache/spark/pull/884
+
+ [SPARK-1914] [SQL] Simplify CountFunction not to traverse to evaluate all child expressions.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-26 00:17:20 -0700
+ Commit: d6395d8, github.com/apache/spark/pull/861
+
+ HOTFIX: Add no-arg SparkContext constructor in Java
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-25 20:13:32 -0700
+ Commit: b6d22af, github.com/apache/spark/pull/878
+
+ [SQL] Minor: Introduce SchemaRDD#aggregate() for simple aggregations
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-25 18:37:44 -0700
+ Commit: c3576ff, github.com/apache/spark/pull/874
+
+ SPARK-1903 Document Spark's network connections
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-25 17:15:47 -0700
+ Commit: 0659529, github.com/apache/spark/pull/856
+
+ Fix PEP8 violations in Python mllib.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 17:15:01 -0700
+ Commit: d33d3c6, github.com/apache/spark/pull/871
+
+ Python docstring update for sql.py.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 16:04:17 -0700
+ Commit: 14f0358, github.com/apache/spark/pull/869
+
+ Fix PEP8 violations in examples/src/main/python.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 14:48:27 -0700
+ Commit: d79c2b2, github.com/apache/spark/pull/870
+
+ Added license header for tox.ini.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 01:47:08 -0700
+ Commit: 55fddf9
+
+ SPARK-1822: Some minor cleanup work on SchemaRDD.count()
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 01:44:49 -0700
+ Commit: d66642e, github.com/apache/spark/pull/868
+
+ Added PEP8 style configuration file.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 01:32:15 -0700
+ Commit: 5c7faec, github.com/apache/spark/pull/872
+
+ [SPARK-1822] SchemaRDD.count() should use query optimizer
+ Kan Zhang <kzhang@apache.org>
+ 2014-05-25 00:06:42 -0700
+ Commit: 6052db9, github.com/apache/spark/pull/841
+
+ spark-submit: add exec at the end of the script
+ Colin Patrick Mccabe <cmccabe@cloudera.com>
+ 2014-05-24 22:39:27 -0700
+ Commit: 6e9fb63, github.com/apache/spark/pull/858
+
+ [SPARK-1913][SQL] Bug fix: column pruning error in Parquet support
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-05-24 20:42:01 -0700
+ Commit: 5afe6af, github.com/apache/spark/pull/863
+
+ [SPARK-1886] check executor id existence when executor exit
+ Zhen Peng <zhenpeng01@baidu.com>
+ 2014-05-24 20:40:19 -0700
+ Commit: 4e4831b, github.com/apache/spark/pull/827
+
+ SPARK-1911: Emphasize that Spark jars should be built with Java 6.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-24 18:27:00 -0700
+ Commit: 75a0327, github.com/apache/spark/pull/859
+
+ [SPARK-1900 / 1918] PySpark on YARN is broken
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-24 18:01:49 -0700
+ Commit: 5081a0a, github.com/apache/spark/pull/853
+
+ Update LBFGSSuite.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-05-23 13:02:40 -0700
+ Commit: a08262d, github.com/apache/spark/pull/815
+
+ Updated scripts for auditing releases
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-22 20:48:55 -0700
+ Commit: b2bdd0e, github.com/apache/spark/pull/844
+
+ [SPARK-1896] Respect spark.master (and --master) before MASTER in spark-shell
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-22 20:32:27 -0700
+ Commit: cce7745, github.com/apache/spark/pull/846
+
+ [SPARK-1897] Respect spark.jars (and --jars) in spark-shell
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-22 20:25:41 -0700
+ Commit: 8edbee7, github.com/apache/spark/pull/849
+
+ Fix UISuite unit test that fails under Jenkins contention
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-22 15:11:05 -0700
+ Commit: f9f5fd5, github.com/apache/spark/pull/857
+
+ [SPARK-1870] Make spark-submit --jars work in yarn-cluster mode.
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-22 01:52:50 -0700
+ Commit: dba3140, github.com/apache/spark/pull/848
+
+ Configuration documentation updates
+ Reynold Xin <rxin@apache.org>
+ 2014-05-21 18:49:12 -0700
+ Commit: 2a948e7, github.com/apache/spark/pull/851
+
+ [SPARK-1889] [SQL] Apply splitConjunctivePredicates to join condition while finding join ke...
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-21 15:37:47 -0700
+ Commit: bb88875, github.com/apache/spark/pull/836
+
+ [SPARK-1519] Support minPartitions param of wholeTextFiles() in PySpark
+ Kan Zhang <kzhang@apache.org>
+ 2014-05-21 13:26:53 -0700
+ Commit: f18fd05, github.com/apache/spark/pull/697
+
+ [Typo] Stoped -> Stopped
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-21 11:59:05 -0700
+ Commit: ba5d4a9, github.com/apache/spark/pull/847
+
+ [Minor] Move JdbcRDDSuite to the correct package
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-21 01:25:10 -0700
+ Commit: 7c79ef7, github.com/apache/spark/pull/839
+
+ [Docs] Correct example of creating a new SparkConf
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-21 01:23:34 -0700
+ Commit: 1014668, github.com/apache/spark/pull/842
+
+ [SPARK-1250] Fixed misleading comments in bin/pyspark, bin/spark-class
+ Sumedh Mungee <smungee@gmail.com>
+ 2014-05-21 01:22:25 -0700
+ Commit: 6e33738, github.com/apache/spark/pull/843
+
+ [Hotfix] Blacklisted flaky HiveCompatibility test
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-20 10:27:12 -0700
+ Commit: 7f0cfe4, github.com/apache/spark/pull/838
+
+ [Spark 1877] ClassNotFoundException when loading RDD with serialized objects
+ Tathagata Das <tathagata.das1565@gmail.com>, Ghidireac <bogdang@u448a5b0a73d45358d94a.ant.amazon.com>
+ 2014-05-19 22:36:24 -0700
+ Commit: 52eb54d, github.com/apache/spark/pull/835
+
+ [SPARK-1874][MLLIB] Clean up MLlib sample data
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-19 21:29:33 -0700
+ Commit: bcb9dce, github.com/apache/spark/pull/833
+
+ SPARK-1689: Spark application should die when removed by Master
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-19 20:55:26 -0700
+ Commit: b0ce22e, github.com/apache/spark/pull/832
+
+ [SPARK-1875]NoClassDefFoundError: StringUtils when building with hadoop 1.x and hive
+ witgo <witgo@qq.com>
+ 2014-05-19 19:40:29 -0700
+ Commit: 6a2c5c6, github.com/apache/spark/pull/824
+
+ SPARK-1879. Increase MaxPermSize since some of our builds have many classes
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-19 18:42:28 -0700
+ Commit: 5af99d7, github.com/apache/spark/pull/823
+
+ SPARK-1878: Fix the incorrect initialization order
+ zsxwing <zsxwing@gmail.com>
+ 2014-05-19 16:41:31 -0700
+ Commit: 1811ba8, github.com/apache/spark/pull/822
+
+ [SPARK-1876] Windows fixes to deal with latest distribution layout changes
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-19 15:02:35 -0700
+ Commit: 7b70a70, github.com/apache/spark/pull/819
+
+ [WIP][SPARK-1871][MLLIB] Improve MLlib guide for v1.0
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-18 17:00:57 -0700
+ Commit: df0aa83, github.com/apache/spark/pull/816
+
+ SPARK-1873: Add README.md file when making distributions
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-18 16:51:53 -0700
+ Commit: 4ce4793, github.com/apache/spark/pull/818
+
+ Fix spark-submit path in spark-shell & pyspark
+ Neville Li <neville@spotify.com>
+ 2014-05-18 13:31:23 -0700
+ Commit: ebcd2d6, github.com/apache/spark/pull/812
+
+ Make deprecation warning less severe
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-16 22:58:47 -0700
+ Commit: 442808a, github.com/apache/spark/pull/810
+
+ [SPARK-1824] Remove <master> from Python examples
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-16 22:36:23 -0700
+ Commit: cf6cbe9, github.com/apache/spark/pull/802
+
+ [SPARK-1808] Route bin/pyspark through Spark submit
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-16 22:34:38 -0700
+ Commit: 4b8ec6f, github.com/apache/spark/pull/799
+
+ Version bump of spark-ec2 scripts
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-16 21:42:14 -0700
+ Commit: c0ab85d, github.com/apache/spark/pull/809
+
+ SPARK-1864 Look in spark conf instead of system properties when propagating configuration to executors.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-16 20:25:10 -0700
+ Commit: a80a6a1, github.com/apache/spark/pull/808
+
+ Tweaks to Mesos docs
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-16 17:35:05 -0700
+ Commit: fed6303, github.com/apache/spark/pull/806
+
+ SPARK-1487 [SQL] Support record filtering via predicate pushdown in Parquet
+ Andre Schumacher <andre.schumacher@iki.fi>
+ 2014-05-16 13:41:41 -0700
+ Commit: 40d6acd, github.com/apache/spark/pull/511
+
+ [SQL] Implement between in hql
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-16 11:47:00 -0700
+ Commit: 032d663, github.com/apache/spark/pull/804
+
+ bugfix: overflow of graphx Edge compare function
+ Zhen Peng <zhenpeng01@baidu.com>
+ 2014-05-16 11:37:18 -0700
+ Commit: fa6de40, github.com/apache/spark/pull/769
+
+ HOTFIX: Duplication of hbase version
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-15 23:33:27 -0700
+ Commit: e304eb9
+
+ SPARK-1862: Support for MapR in the Maven build.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-15 23:31:43 -0700
+ Commit: 17702e2, github.com/apache/spark/pull/803
+
+ [Spark-1461] Deferred Expression Evaluation (short-circuit evaluation)
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-05-15 22:12:34 -0700
+ Commit: a20fea9, github.com/apache/spark/pull/446
+
+ SPARK-1860: Do not cleanup application work/ directories by default
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-15 21:37:58 -0700
+ Commit: bb98eca, github.com/apache/spark/pull/800
+
+ Typos in Spark
+ Huajian Mao <huajianmao@gmail.com>
+ 2014-05-15 18:20:16 -0700
+ Commit: 94c5139, github.com/apache/spark/pull/798
+
+ Fixes a misplaced comment.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-05-15 16:58:37 -0700
+ Commit: e1e3416, github.com/apache/spark/pull/788
+
+ [SQL] Fix tiny/small ints from HiveMetastore.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-15 16:50:42 -0700
+ Commit: a4aafe5, github.com/apache/spark/pull/797
+
+ SPARK-1803 Replaced colon in filenames with a dash
+ Stevo Slavić <sslavic@gmail.com>, Stevo Slavic <sslavic@gmail.com>
+ 2014-05-15 16:44:14 -0700
+ Commit: e66e31b, github.com/apache/spark/pull/739
+
+ SPARK-1851. Upgrade Avro dependency to 1.7.6 so Spark can read Avro file...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-05-15 16:35:39 -0700
+ Commit: 08e7606, github.com/apache/spark/pull/795
+
+ [SPARK-1741][MLLIB] add predict(JavaRDD) to RegressionModel, ClassificationModel, and KMeans
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-15 11:59:59 -0700
+ Commit: d52761d, github.com/apache/spark/pull/670
+
+ [SPARK-1819] [SQL] Fix GetField.nullable.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-15 11:21:33 -0700
+ Commit: 94c9d6f, github.com/apache/spark/pull/757
+
+ [SPARK-1845] [SQL] Use AllScalaRegistrar for SparkSqlSerializer to register serializers of ...
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-15 11:20:21 -0700
+ Commit: db8cc6f, github.com/apache/spark/pull/790
+
+ SPARK-1846 Ignore logs directory in RAT checks
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-15 11:05:39 -0700
+ Commit: 3abe2b7, github.com/apache/spark/pull/793
+
+ HOTFIX: Don't build Javadoc in Maven when creating releases.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 23:48:03 -0700
+ Commit: 514157f
+
+ fix different versions of commons-lang dependency and apache/spark#746 addendum
+ witgo <witgo@qq.com>
+ 2014-05-14 22:26:26 -0700
+ Commit: bae07e3, github.com/apache/spark/pull/754
+
+ Package docs
+ Prashant Sharma <prashant.s@imaginea.com>, Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 22:24:41 -0700
+ Commit: 4632427, github.com/apache/spark/pull/785
+
+ Documentation: Encourage use of reduceByKey instead of groupByKey.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 22:24:04 -0700
+ Commit: 21570b4, github.com/apache/spark/pull/784
+
+ Add language tabs and Python version to interactive part of quick-start
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-14 21:45:20 -0700
+ Commit: f10de04, github.com/apache/spark/pull/782
+
+ [SPARK-1840] SparkListenerBus prints out scary error message when terminated normally
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-14 21:13:41 -0700
+ Commit: ad4e60e, github.com/apache/spark/pull/783
+
+ default task number misleading in several places
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-05-14 18:20:20 -0700
+ Commit: 2f63995, github.com/apache/spark/pull/766
+
+ [SPARK-1826] fix the head notation of package object dsl
+ wangfei <scnbwf@yeah.net>
+ 2014-05-14 17:59:11 -0700
+ Commit: 44165fc, github.com/apache/spark/pull/765
+
+ [Typo] propertes -> properties
+ andrewor14 <andrewor14@gmail.com>
+ 2014-05-14 17:54:53 -0700
+ Commit: 9ad096d, github.com/apache/spark/pull/780
+
+ [SPARK-1696][MLLIB] use alpha in dense dspr
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-14 17:18:30 -0700
+ Commit: e3d72a7, github.com/apache/spark/pull/778
+
+ String interpolation + some other small changes
+ Jacek Laskowski <jacek@japila.pl>
+ 2014-05-14 15:45:52 -0700
+ Commit: 601e371, github.com/apache/spark/pull/748
+
+ [FIX] do not load defaults when testing SparkConf in pyspark
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-14 14:57:17 -0700
+ Commit: 94c6c06, github.com/apache/spark/pull/775
+
+ SPARK-1833 - Have an empty SparkContext constructor.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 12:53:30 -0700
+ Commit: 65533c7, github.com/apache/spark/pull/774
+
+ SPARK-1829 Sub-second durations shouldn't round to "0 s"
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-14 12:01:14 -0700
+ Commit: a3315d7, github.com/apache/spark/pull/768
+
+ Fix: sbt test throw an java.lang.OutOfMemoryError: PermGen space
+ witgo <witgo@qq.com>
+ 2014-05-14 11:19:26 -0700
+ Commit: fde82c1, github.com/apache/spark/pull/773
+
+ [SPARK-1620] Handle uncaught exceptions in function run by Akka scheduler
+ Mark Hamstra <markhamstra@gmail.com>
+ 2014-05-14 10:07:25 -0700
+ Commit: 17f3075, github.com/apache/spark/pull/622
+
+ SPARK-1828: Created forked version of hive-exec that doesn't bundle other dependencies
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 09:51:01 -0700
+ Commit: d58cb33, github.com/apache/spark/pull/767
+
+ SPARK-1818 Freshen Mesos documentation
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-14 09:45:33 -0700
+ Commit: d1d41cc, github.com/apache/spark/pull/756
+
+ SPARK-1827. LICENSE and NOTICE files need a refresh to contain transitive dependency info
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-14 09:38:33 -0700
+ Commit: 2e5a7cd, github.com/apache/spark/pull/770
+
+ Fixed streaming examples docs to use run-example instead of spark-submit
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-14 04:17:32 -0700
+ Commit: 68f28da, github.com/apache/spark/pull/722
+
+ [SPARK-1769] Executor loss causes NPE race condition
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-14 00:54:33 -0700
+ Commit: 69f7502, github.com/apache/spark/pull/762
+
+ Fix dep exclusion: avro-ipc, not avro, depends on netty.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-05-14 00:37:57 -0700
+ Commit: 54ae832, github.com/apache/spark/pull/763
+
+ SPARK-1801. expose InterruptibleIterator and TaskKilledException in deve...
+ Koert Kuipers <koert@tresata.com>
+ 2014-05-14 00:10:12 -0700
+ Commit: b22952f, github.com/apache/spark/pull/764
+
+ [SQL] Improve column pruning.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-13 23:27:22 -0700
+ Commit: 6ce0884, github.com/apache/spark/pull/729
+
+ Revert "[SPARK-1784] Add a new partitioner to allow specifying # of keys per partition"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-13 23:24:51 -0700
+ Commit: 7bb9a52
+
+ Implement ApproximateCountDistinct for SparkSql
+ larvaboy <larvaboy@gmail.com>
+ 2014-05-13 21:26:08 -0700
+ Commit: c33b8dc, github.com/apache/spark/pull/737
+
+ [SPARK-1784] Add a new partitioner to allow specifying # of keys per partition
+ Syed Hashmi <shashmi@cloudera.com>
+ 2014-05-13 21:24:23 -0700
+ Commit: 92cebad, github.com/apache/spark/pull/721
+
+ [SQL] Make it possible to create Java/Python SQLContexts from an existing Scala SQLContext.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-13 21:23:51 -0700
+ Commit: 4423386, github.com/apache/spark/pull/761
+
+ [SPARK-1527] change rootDir*.getName to rootDir*.getAbsolutePath
+ Ye Xianjin <advancedxy@gmail.com>
+ 2014-05-13 19:03:51 -0700
+ Commit: 753b04d, github.com/apache/spark/pull/436
+
+ [SPARK-1816] LiveListenerBus dies if a listener throws an exception
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-13 18:32:32 -0700
+ Commit: 5c0dafc, github.com/apache/spark/pull/759
+
+ SPARK-1791 - SVM implementation does not use threshold parameter
+ Andrew Tulloch <andrew@tullo.ch>
+ 2014-05-13 17:31:27 -0700
+ Commit: d1e4874, github.com/apache/spark/pull/725
+
+ SPARK-571: forbid return statements in cleaned closures
+ William Benton <willb@redhat.com>
+ 2014-05-13 13:45:23 -0700
+ Commit: 16ffadc, github.com/apache/spark/pull/717
+
+ BUILD: Add more content to make-distribution.sh.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 23:02:54 -0700
+ Commit: 52d9052
+
+ SPARK-1815. SparkContext should not be marked DeveloperApi
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-05-12 20:08:30 -0700
+ Commit: 2792bd0, github.com/apache/spark/pull/753
+
+ [SPARK-1753 / 1773 / 1814] Update outdated docs for spark-submit, YARN, standalone etc.
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-12 19:44:14 -0700
+ Commit: 2ffd1ea, github.com/apache/spark/pull/701
+
+ [SPARK-1780] Non-existent SPARK_DAEMON_OPTS is lurking around
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-12 19:42:35 -0700
+ Commit: ba96bb3, github.com/apache/spark/pull/751
+
+ SPARK-1757 Failing test for saving null primitives with .saveAsParquetFile()
+ Andrew Ash <andrew@andrewash.com>, Michael Armbrust <michael@databricks.com>
+ 2014-05-12 19:23:39 -0700
+ Commit: 156df87, github.com/apache/spark/pull/690
+
+ Modify a typo in monitoring.md
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-05-12 19:21:06 -0700
+ Commit: 9cf9f18, github.com/apache/spark/pull/698
+
+ L-BFGS Documentation
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-05-12 19:20:24 -0700
+ Commit: 5c2275d, github.com/apache/spark/pull/702
+
+ Typo: resond -> respond
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-12 18:46:28 -0700
+ Commit: a5150d1, github.com/apache/spark/pull/743
+
+ [SQL] Make Hive Metastore conversion functions publicly visible.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-12 18:40:30 -0700
+ Commit: 2f1a337, github.com/apache/spark/pull/750
+
+ Adding hadoop-2.2 profile to the build
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 15:40:48 -0700
+ Commit: 3e13b8c
+
+ [SPARK-1736] Spark submit for Windows
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-12 17:39:40 -0700
+ Commit: beb9cba, github.com/apache/spark/pull/745
+
+ SPARK-1802. (Addendium) Audit dependency graph when Spark is built with -Pyarn
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-12 17:35:29 -0700
+ Commit: 4b31f4e, github.com/apache/spark/pull/746
+
+ SPARK-1623: Use File objects instead of String's in HTTPBroadcast
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 17:27:28 -0700
+ Commit: 925d8b2, github.com/apache/spark/pull/749
+
+ Rename testExecutorEnvs --> executorEnvs.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 17:09:13 -0700
+ Commit: 3ce526b, github.com/apache/spark/pull/747
+
+ SPARK-1802. Audit dependency graph when Spark is built with -Phive
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-12 14:17:25 -0700
+ Commit: 8586bf5, github.com/apache/spark/pull/744
+
+ SPARK-1798. Tests should clean up temp files
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-12 14:16:19 -0700
+ Commit: 7120a29, github.com/apache/spark/pull/732
+
+ BUILD: Include Hive with default packages when creating a release
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 13:20:23 -0700
+ Commit: 1e4a65e
+
+ SPARK-1786: Reopening PR 724
+ Ankur Dave <ankurdave@gmail.com>, Joseph E. Gonzalez <joseph.e.gonzalez@gmail.com>
+ 2014-05-12 13:05:24 -0700
+ Commit: 0e2bde2, github.com/apache/spark/pull/742
+
+ SPARK-1806: Upgrade Mesos dependency to 0.18.1
+ Bernardo Gomez Palacio <bernardo.gomezpalacio@gmail.com>
+ 2014-05-12 11:10:28 -0700
+ Commit: d9c97ba, github.com/apache/spark/pull/741
+
+ SPARK-1772 Stop catching Throwable, let Executors die
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-12 11:08:52 -0700
+ Commit: 3af1f38, github.com/apache/spark/pull/715
+
+ Revert "SPARK-1786: Edge Partition Serialization"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 10:49:03 -0700
+ Commit: af15c82
+
+ SPARK-1786: Edge Partition Serialization
+ Ankur Dave <ankurdave@gmail.com>, Joseph E. Gonzalez <joseph.e.gonzalez@gmail.com>
+ 2014-05-11 19:20:42 -0700
+ Commit: a6b02fb, github.com/apache/spark/pull/724
+
+ Fix error in 2d Graph Partitioner
+ Joseph E. Gonzalez <joseph.e.gonzalez@gmail.com>
+ 2014-05-11 18:33:46 -0700
+ Commit: f938a15, github.com/apache/spark/pull/709
+
+ SPARK-1652: Set driver memory correctly in spark-submit.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-11 18:17:34 -0700
+ Commit: 05c9aa9, github.com/apache/spark/pull/730
+
+ SPARK-1770: Load balance elements when repartitioning.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-11 17:11:55 -0700
+ Commit: 7d9cc92, github.com/apache/spark/pull/727
+
+ remove outdated runtime Information scala home
+ witgo <witgo@qq.com>
+ 2014-05-11 14:34:27 -0700
+ Commit: 6bee01d, github.com/apache/spark/pull/728
+
+ Enabled incremental build that comes with sbt 0.13.2
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-05-10 21:08:04 -0700
+ Commit: 70bcdef, github.com/apache/spark/pull/525
+
+ [SPARK-1774] Respect SparkSubmit --jars on YARN (client)
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-10 20:58:02 -0700
+ Commit: 83e0424, github.com/apache/spark/pull/710
+
+ SPARK-1789. Multiple versions of Netty dependencies cause FlumeStreamSuite failure
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-10 20:50:40 -0700
+ Commit: 2b7bd29, github.com/apache/spark/pull/723
+
+ Unify GraphImpl RDDs + other graph load optimizations
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-05-10 14:48:07 -0700
+ Commit: 905173d, github.com/apache/spark/pull/497
+
+ [SPARK-1690] Tolerating empty elements when saving Python RDD to text files
+ Kan Zhang <kzhang@apache.org>
+ 2014-05-10 14:01:08 -0700
+ Commit: 6c2691d, github.com/apache/spark/pull/644
+
+ Add Python includes to path before depickling broadcast values
+ Bouke van der Bijl <boukevanderbijl@gmail.com>
+ 2014-05-10 13:02:13 -0700
+ Commit: 3776f2f, github.com/apache/spark/pull/656
+
+ fix broken in link in python docs
+ Andy Konwinski <andykonwinski@gmail.com>
+ 2014-05-10 12:46:51 -0700
+ Commit: c05d11b, github.com/apache/spark/pull/650
+
+ SPARK-1708. Add a ClassTag on Serializer and things that depend on it
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-10 12:10:24 -0700
+ Commit: 7eefc9d, github.com/apache/spark/pull/700
+
+ [SPARK-1778] [SQL] Add 'limit' transformation to SchemaRDD.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-10 12:03:27 -0700
+ Commit: 8e94d27, github.com/apache/spark/pull/711
+
+ [SQL] Upgrade parquet library.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-10 11:48:01 -0700
+ Commit: 4d60553, github.com/apache/spark/pull/684
+
+ [SPARK-1644] The org.datanucleus:* should not be packaged into spark-assembly-*.jar
+ witgo <witgo@qq.com>
+ 2014-05-10 10:15:04 -0700
+ Commit: 5615108, github.com/apache/spark/pull/688
+
+ SPARK-1686: keep schedule() calling in the main thread
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-05-09 21:50:23 -0700
+ Commit: 2f452cb, github.com/apache/spark/pull/639
+
+ SPARK-1770: Revert accidental(?) fix
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-09 14:51:34 -0700
+ Commit: 59577df, github.com/apache/spark/pull/716
+
+ [SPARK-1760]: fix building spark with maven documentation
+ witgo <witgo@qq.com>
+ 2014-05-09 01:51:26 -0700
+ Commit: bd67551, github.com/apache/spark/pull/712
+
+ Converted bang to ask to avoid scary warning when a block is removed
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-08 22:34:08 -0700
+ Commit: 32868f3, github.com/apache/spark/pull/708
+
+ MINOR: Removing dead code.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-08 22:33:06 -0700
+ Commit: 4c60fd1
+
+ SPARK-1775: Unneeded lock in ShuffleMapTask.deserializeInfo
+ Sandeep <sandeep@techaddict.me>
+ 2014-05-08 22:30:17 -0700
+ Commit: 7db47c4, github.com/apache/spark/pull/707
+
+ SPARK-1565 (Addendum): Replace `run-example` with `spark-submit`.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-08 22:26:17 -0700
+ Commit: 06b15ba, github.com/apache/spark/pull/704
+
+ [SPARK-1631] Correctly set the Yarn app name when launching the AM.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-05-08 20:46:11 -0700
+ Commit: 3f779d8, github.com/apache/spark/pull/539
+
+ [SPARK-1755] Respect SparkSubmit --name on YARN
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-08 20:45:29 -0700
+ Commit: 8b78412, github.com/apache/spark/pull/699
+
+ Include the sbin/spark-config.sh in spark-executor
+ Bouke van der Bijl <boukevanderbijl@gmail.com>
+ 2014-05-08 20:43:37 -0700
+ Commit: 2fd2752, github.com/apache/spark/pull/651
+
+ Bug fix of sparse vector conversion
+ Funes <tianshaocun@gmail.com>, funes <tianshaocun@gmail.com>
+ 2014-05-08 17:54:10 -0700
+ Commit: 191279c, github.com/apache/spark/pull/661
+
+ [SPARK-1157][MLlib] Bug fix: lossHistory should exclude rejection steps, and remove miniBatch
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-05-08 17:53:22 -0700
+ Commit: 910a13b, github.com/apache/spark/pull/582
+
+ MLlib documentation fix
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-05-08 17:52:32 -0700
+ Commit: d38febe, github.com/apache/spark/pull/703
+
+ [SPARK-1754] [SQL] Add missing arithmetic DSL operations.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-08 15:31:47 -0700
+ Commit: 322b180, github.com/apache/spark/pull/689
+
+ Fixing typo in als.py
+ Evan Sparks <evan.sparks@gmail.com>
+ 2014-05-08 13:07:30 -0700
+ Commit: 5c5e7d5, github.com/apache/spark/pull/696
+
+ [SPARK-1745] Move interrupted flag from TaskContext constructor (minor)
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-08 12:13:07 -0700
+ Commit: c3f8b78, github.com/apache/spark/pull/675
+
+ SPARK-1565, update examples to be used with spark-submit script.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-05-08 10:23:05 -0700
+ Commit: 44dd57f, github.com/apache/spark/pull/552
+
+ [SQL] Improve SparkSQL Aggregates
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-08 01:08:43 -0400
+ Commit: 19c8fb0, github.com/apache/spark/pull/683
+
+ Use numpy directly for matrix multiply.
+ Evan Sparks <evan.sparks@gmail.com>
+ 2014-05-08 00:24:36 -0400
+ Commit: 6ed7e2c, github.com/apache/spark/pull/687
+
+ SPARK-1668: Add implicit preference as an option to examples/MovieLensALS
+ Sandeep <sandeep@techaddict.me>
+ 2014-05-08 00:15:05 -0400
+ Commit: 108c4c1, github.com/apache/spark/pull/597
+
+ SPARK-1544 Add support for deep decision trees.
+ Manish Amde <manish9ue@gmail.com>, manishamde <manish9ue@gmail.com>, Evan Sparks <sparks@cs.berkeley.edu>
+ 2014-05-07 17:08:38 -0700
+ Commit: f269b01, github.com/apache/spark/pull/475
+
+ Update GradientDescentSuite.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-05-07 16:02:55 -0700
+ Commit: 0c19bb1, github.com/apache/spark/pull/588
+
+ [SPARK-1743][MLLIB] add loadLibSVMFile and saveAsLibSVMFile to pyspark
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-07 16:01:11 -0700
+ Commit: 3188553, github.com/apache/spark/pull/672
+
+ SPARK-1569 Spark on Yarn, authentication broken by pr299
+ Thomas Graves <tgraves@apache.org>
+ 2014-05-07 15:51:53 -0700
+ Commit: 4bec84b, github.com/apache/spark/pull/649
+
+ [SPARK-1688] Propagate PySpark worker stderr to driver
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-07 14:35:22 -0700
+ Commit: 5200872, github.com/apache/spark/pull/603
+
+ Typo fix: fetchting -> fetching
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-07 17:24:49 -0400
+ Commit: d00981a, github.com/apache/spark/pull/680
+
+ Nicer logging for SecurityManager startup
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-07 17:24:12 -0400
+ Commit: 7f6f4a1, github.com/apache/spark/pull/678
+
+ [SQL] Fix Performance Issue in data type casting
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-05-07 16:54:58 -0400
+ Commit: ca43186, github.com/apache/spark/pull/679
+
+ SPARK-1579: Clean up PythonRDD and avoid swallowing IOExceptions
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-07 09:48:31 -0700
+ Commit: 3308722, github.com/apache/spark/pull/640
+
+ [SPARK-1460] Returning SchemaRDD instead of normal RDD on Set operations...
+ Kan Zhang <kzhang@apache.org>
+ 2014-05-07 09:41:31 -0700
+ Commit: 967635a, github.com/apache/spark/pull/448
+
+ [WIP][Spark-SQL] Optimize the Constant Folding for Expression
+ Cheng Hao <hao.cheng@intel.com>, Michael Armbrust <michael@databricks.com>
+ 2014-05-07 03:37:12 -0400
+ Commit: 3eb53bd, github.com/apache/spark/pull/482
+
+ SPARK-1746: Support setting SPARK_JAVA_OPTS on executors for backwards compatibility
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-07 00:11:05 -0700
+ Commit: 913a0a9, github.com/apache/spark/pull/676
+
+ [HOTFIX] SPARK-1637: There are some Streaming examples added after the PR #571 was last updated.
+ Sandeep <sandeep@techaddict.me>
+ 2014-05-06 21:55:05 -0700
+ Commit: fdae095, github.com/apache/spark/pull/673
+
+ Proposal: clarify Scala programming guide on caching ...
+ Ethan Jewett <esjewett@gmail.com>
+ 2014-05-06 20:50:08 -0700
+ Commit: 48ba3b8, github.com/apache/spark/pull/668
+
+ SPARK-1727. Correct small compile errors, typos, and markdown issues in (primarily) MLlib docs
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-06 20:07:22 -0700
+ Commit: 25ad8f9, github.com/apache/spark/pull/653
+
+ SPARK-1637: Clean up examples for 1.0
+ Sandeep <sandeep@techaddict.me>
+ 2014-05-06 17:27:52 -0700
+ Commit: a000b5c, github.com/apache/spark/pull/571
+
+ SPARK-1737: Warn rather than fail when Java 7+ is used to create distributions
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-06 15:41:46 -0700
+ Commit: 39b8b14, github.com/apache/spark/pull/669
+
+ [SPARK-1549] Add Python support to spark-submit
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-06 15:12:35 -0700
+ Commit: 951a5d9, github.com/apache/spark/pull/664
+
+ SPARK-1734: spark-submit throws an exception: Exception in thread "main"...
+ witgo <witgo@qq.com>
+ 2014-05-06 14:17:39 -0700
+ Commit: ec09acd, github.com/apache/spark/pull/665
+
+ [SPARK-1685] Cancel retryTimer on restart of Worker or AppClient
+ Mark Hamstra <markhamstra@gmail.com>
+ 2014-05-06 12:53:39 -0700
+ Commit: fbfe69d, github.com/apache/spark/pull/602
+
+ Fix two download suggestions in the docs:
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-06 12:07:46 -0700
+ Commit: 7b978c1, github.com/apache/spark/pull/662
+
+ SPARK-1474: Spark on yarn assembly doesn't include AmIpFilter
+ Thomas Graves <tgraves@apache.org>
+ 2014-05-06 12:00:09 -0700
+ Commit: 1e82990, github.com/apache/spark/pull/406
+
+ Update OpenHashSet.scala
+ ArcherShao <ArcherShao@users.noreply.github.com>
+ 2014-05-06 10:12:59 -0700
+ Commit: 0a5a468, github.com/apache/spark/pull/667
+
+ [SQL] SPARK-1732 - Support for null primitive values.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-05 22:59:42 -0700
+ Commit: 3c64750, github.com/apache/spark/pull/658
+
+ [SPARK-1735] Add the missing special profiles to make-distribution.sh
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-05 22:14:47 -0700
+ Commit: a2262cd, github.com/apache/spark/pull/660
+
+ [SPARK-1678][SPARK-1679] In-memory compression bug fix and made compression configurable, disabled by default
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-05-05 19:38:59 -0700
+ Commit: 6d721c5, github.com/apache/spark/pull/608
+
+ [SPARK-1594][MLLIB] Cleaning up MLlib APIs and guide
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-05 18:32:54 -0700
+ Commit: 98750a7, github.com/apache/spark/pull/524
+
+ Expose SparkListeners and relevant classes as DeveloperApi
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-05 18:32:14 -0700
+ Commit: ea10b31, github.com/apache/spark/pull/648
+
+ SPARK-1728. JavaRDDLike.mapPartitionsWithIndex requires ClassTag
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-05-05 18:26:34 -0700
+ Commit: 8e724dc, github.com/apache/spark/pull/657
+
+ [SPARK-1681] Include datanucleus jars in Spark Hive distribution
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-05 16:28:07 -0700
+ Commit: cf0a8f0, github.com/apache/spark/pull/610
+
+ [SPARK-1504], [SPARK-1505], [SPARK-1558] Updated Spark Streaming guide
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-05 15:28:19 -0700
+ Commit: a975a19, github.com/apache/spark/pull/652
+
+ SPARK-1721: Reset the thread classLoader in the Mesos Executor
+ Bouke van der Bijl <boukevanderbijl@gmail.com>
+ 2014-05-05 11:19:35 -0700
+ Commit: 3292e2a, github.com/apache/spark/pull/620
+
+ SPARK-1556. jets3t dep doesn't update properly with newer Hadoop versions
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-05 10:33:49 -0700
+ Commit: 73b0cbc, github.com/apache/spark/pull/629
+
+ Updated doc for spark.closure.serializer to indicate only the Java serializer works.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-05 00:52:06 -0700
+ Commit: f2eb070, github.com/apache/spark/pull/642
+
+ Address SPARK-1717
+ msiddalingaiah <madhu@madhu.com>
+ 2014-05-04 21:59:10 -0700
+ Commit: bb2bb0c, github.com/apache/spark/pull/641
+
+ SPARK-1710: spark-submit should print better errors than "InvocationTargetException"
+ Sandeep <sandeep@techaddict.me>
+ 2014-05-04 20:51:53 -0700
+ Commit: b48a55a, github.com/apache/spark/pull/630
+
+ EC2 script should exit with non-zero code on UsageError
+ Allan Douglas R. de Oliveira <allan@chaordicsystems.com>
+ 2014-05-04 20:36:51 -0700
+ Commit: bcb9b7f, github.com/apache/spark/pull/638
+
+ SPARK-1693: Most of the tests throw a java.lang.SecurityException when s...
+ witgo <witgo@qq.com>
+ 2014-05-04 17:48:52 -0700
+ Commit: d940e4c, github.com/apache/spark/pull/628
+
+ SPARK-1629. Addendum: Depend on commons lang3 (already used by tachyon) as it's used in ReplSuite, and return to use lang3 utility in Utils.scala
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-04 17:43:28 -0700
+ Commit: f504157, github.com/apache/spark/pull/635
+
+ SPARK-1703 Warn users if Spark is run on JRE6 but compiled with JDK7.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-04 12:22:23 -0700
+ Commit: 0c98a8f, github.com/apache/spark/pull/627
+
+ SPARK-1663. (Addendum) Fix signature of one version of JavaPairRDDStream.reduceByKeyAndWindow()
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-04 11:55:29 -0700
+ Commit: 0088ced, github.com/apache/spark/pull/633
+
+ SPARK-1658: Correctly identify if maven is installed and working
+ Rahul Singhal <rahul.singhal@guavus.com>
+ 2014-05-04 11:08:39 -0700
+ Commit: e97a2e6, github.com/apache/spark/pull/580
+
+ The default version of yarn is equal to the hadoop version
+ witgo <witgo@qq.com>
+ 2014-05-03 23:32:12 -0700
+ Commit: fb05432, github.com/apache/spark/pull/626
+
+ Whitelist Hive Tests
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-03 23:13:51 -0700
+ Commit: 92b2902, github.com/apache/spark/pull/596
+
+ [SQL] Better logging when applying rules.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-03 18:38:44 -0700
+ Commit: b295714, github.com/apache/spark/pull/616
+
+ EC2 configurable workers
+ Allan Douglas R. de Oliveira <allan@chaordicsystems.com>
+ 2014-05-03 16:52:19 -0700
+ Commit: 4669a84, github.com/apache/spark/pull/612
+
+ SPARK-1689 AppClient should indicate app is dead() when removed
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-03 13:27:10 -0700
+ Commit: 34719ba, github.com/apache/spark/pull/605
+
+ [Bugfix] Tachyon file cleanup logical error
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-05-03 13:23:52 -0700
+ Commit: ce72c72, github.com/apache/spark/pull/575
+
+ SPARK-1663. Corrections for several compile errors in streaming code examples, and updates to follow API changes
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-03 12:31:31 -0700
+ Commit: 11d5494, github.com/apache/spark/pull/589
+
+ [WIP] SPARK-1676: Cache Hadoop UGIs by default to prevent FileSystem leak
+ Thomas Graves <tgraves@apache.org>
+ 2014-05-03 10:59:05 -0700
+ Commit: 3d0a02d, github.com/apache/spark/pull/621
+
+ Update SchemaRDD.scala
+ ArcherShao <ArcherShao@users.noreply.github.com>
+ 2014-05-03 00:17:36 -0700
+ Commit: 9347565, github.com/apache/spark/pull/619
+
+ SPARK-1700: Close socket file descriptors on task completion
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-02 23:55:13 -0700
+ Commit: 0a14421, github.com/apache/spark/pull/623
+
+ SPARK-1492. Update Spark YARN docs to use spark-submit
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-05-02 21:42:31 -0700
+ Commit: 2b961d8, github.com/apache/spark/pull/601
+
+ delete no use var
+ wangfei <wangfei_hello@126.com>
+ 2014-05-02 21:34:54 -0700
+ Commit: 4bf24f7, github.com/apache/spark/pull/613
+
+ SPARK-1695: java8-tests compiler error: package com.google.common.co...
+ witgo <witgo@qq.com>
+ 2014-05-02 12:40:27 -0700
+ Commit: f25ebed, github.com/apache/spark/pull/611
+
+ Add tests for FileLogger, EventLoggingListener, and ReplayListenerBus
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-01 21:42:06 -0700
+ Commit: 394d8cb, github.com/apache/spark/pull/591
+
+ SPARK-1659: improvements spark-submit usage
+ witgo <witgo@qq.com>
+ 2014-05-01 21:39:40 -0700
+ Commit: 40cf6d3, github.com/apache/spark/pull/581
+
+ fix the spelling mistake
+ wangfei <wangfei_hello@126.com>
+ 2014-05-01 21:37:22 -0700
+ Commit: 55c760f, github.com/apache/spark/pull/614
+
+ [SQL] SPARK-1661 - Fix regex_serde test
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-01 21:32:43 -0700
+ Commit: a43d9c1, github.com/apache/spark/pull/595
+
+ SPARK-1691: Support quoted arguments inside of spark-submit.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-01 01:15:51 -0700
+ Commit: 98b6559, github.com/apache/spark/pull/609
+
+ Fix SPARK-1629: Spark should inline use of commons-lang `SystemUtils.IS_...
+ witgo <witgo@qq.com>
+ 2014-04-30 09:49:45 -0700
+ Commit: 55100da, github.com/apache/spark/pull/569
+
+ SPARK-1004. PySpark on YARN
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-04-29 23:24:34 -0700
+ Commit: ff5be9a, github.com/apache/spark/pull/30
+
+ Handle the vals that are never used
+ WangTao <barneystinson@aliyun.com>
+ 2014-04-29 22:07:20 -0700
+ Commit: 7025dda, github.com/apache/spark/pull/565
+
+ Args for worker rather than master
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-04-29 22:05:40 -0700
+ Commit: b3d2ab6, github.com/apache/spark/pull/587
+
+ [SPARK-1646] Micro-optimisation of ALS
+ Tor Myklebust <tmyklebu@gmail.com>
+ 2014-04-29 22:04:34 -0700
+ Commit: 5c0cd5c, github.com/apache/spark/pull/568
+
+ [SPARK-1674] fix interrupted system call error in pyspark's RDD.pipe
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-29 18:06:45 -0700
+ Commit: d33df1c, github.com/apache/spark/pull/594
+
+ SPARK-1588. Restore SPARK_YARN_USER_ENV and SPARK_JAVA_OPTS for YARN.
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-04-29 12:54:02 -0700
+ Commit: bf8d0aa, github.com/apache/spark/pull/586
+
+ SPARK-1509: add zipWithIndex zipWithUniqueId methods to java api
+ witgo <witgo@qq.com>
+ 2014-04-29 11:30:47 -0700
+ Commit: 7d15058, github.com/apache/spark/pull/423
+
+ SPARK-1557 Set permissions on event log files/directories
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-29 09:19:48 -0500
+ Commit: 8db0f7e, github.com/apache/spark/pull/538
+
+ HOTFIX: minor change to release script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-29 00:59:38 -0700
+ Commit: 9a1184a
+
+ HOTFIX: minor change to release script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-29 00:53:32 -0700
+ Commit: f04bcaf
+
+ [SPARK-1636][MLLIB] Move main methods to examples
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-29 00:41:03 -0700
+ Commit: 3f38334, github.com/apache/spark/pull/584
+
+ Minor fix to python table caching API.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-29 00:36:15 -0700
+ Commit: 497be3c, github.com/apache/spark/pull/585
+
+ HOTFIX: Bug in release script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-29 00:10:17 -0700
+ Commit: 719c8bc
+
+ Improved build configuration
+ witgo <witgo@qq.com>
+ 2014-04-28 22:50:51 -0700
+ Commit: 030f2c2, github.com/apache/spark/pull/480
+
+ SPARK-1652: Remove incorrect deprecation warning in spark-submit
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-28 18:14:59 -0700
+ Commit: 9f7a095, github.com/apache/spark/pull/578
+
+ SPARK-1654 and SPARK-1653: Fixes in spark-submit.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-28 17:29:22 -0700
+ Commit: 949e393, github.com/apache/spark/pull/576
+
+ SPARK-1652: Spark submit should fail gracefully if YARN not enabled
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-28 17:26:57 -0700
+ Commit: cae054a, github.com/apache/spark/pull/579
+
+ Changes to dev release script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-28 13:58:42 -0700
+ Commit: 8421034
+
+ [SPARK-1633][Streaming] Java API unit test and example for custom streaming receiver in Java
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-28 13:58:09 -0700
+ Commit: 1d84964, github.com/apache/spark/pull/558
+
+ [SQL]Append some missing types for HiveUDF
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-04-27 23:59:42 -0700
+ Commit: f735884, github.com/apache/spark/pull/459
+
+ Update the import package name for TestHive in sbt shell
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-04-27 23:57:29 -0700
+ Commit: ea01aff, github.com/apache/spark/pull/574
+
+ Fix SPARK-1609: Executor fails to start when Command.extraJavaOptions contains multiple Java options
+ witgo <witgo@qq.com>
+ 2014-04-27 19:41:02 -0700
+ Commit: 71f4d26, github.com/apache/spark/pull/547
+
+ SPARK-1145: Memory mapping with many small blocks can cause JVM allocation failures
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-27 17:40:56 -0700
+ Commit: 6b3c6e5, github.com/apache/spark/pull/43
+
+ HOTFIX: Minor patch to merge script.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-27 15:45:17 -0700
+ Commit: 3d9fb09
+
+ SPARK-1651: Delete existing deployment directory
+ Rahul Singhal <rahul.singhal@guavus.com>
+ 2014-04-27 15:50:48 -0700
+ Commit: eefb90d, github.com/apache/spark/pull/573
+
+ SPARK-1648 Support closing JIRA's as part of merge script.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-27 15:41:57 -0700
+ Commit: fe65bee, github.com/apache/spark/pull/570
+
+ SPARK-1650: Correctly identify maven project version
+ Rahul Singhal <rahul.singhal@guavus.com>
+ 2014-04-27 15:17:06 -0700
+ Commit: 7b2527d, github.com/apache/spark/pull/572
+
+ SPARK-1606: Infer user application arguments instead of requiring --arg.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-26 19:24:29 -0700
+ Commit: aa9a7f5, github.com/apache/spark/pull/563
+
+ SPARK-1467: Make StorageLevel.apply() factory methods Developer APIs
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-26 19:04:33 -0700
+ Commit: 762af4e, github.com/apache/spark/pull/551
+
+ [SPARK-1608] [SQL] Fix Cast.nullable when cast from StringType to NumericType/TimestampType.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-04-26 14:39:54 -0700
+ Commit: 8e37ed6, github.com/apache/spark/pull/532
+
+ add note of how to support table with more than 22 fields
+ wangfei <wangfei1@huawei.com>
+ 2014-04-26 14:38:42 -0700
+ Commit: e6e44e4, github.com/apache/spark/pull/564
+
+ [Spark-1382] Fix NPE in DStream.slice (updated version of #365)
+ zsxwing <zsxwing@gmail.com>, Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-25 19:04:34 -0700
+ Commit: 058797c, github.com/apache/spark/pull/562
+
+ SPARK-1632. Remove unnecessary boxing in compares in ExternalAppendOnlyM...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-04-25 17:55:04 -0700
+ Commit: 87cf35c, github.com/apache/spark/pull/559
+
+ SPARK-1235: manage the DAGScheduler EventProcessActor with supervisor and refactor the DAGScheduler with Akka
+ CodingCat <zhunansjtu@gmail.com>, Xiangrui Meng <meng@databricks.com>, Nan Zhu <CodingCat@users.noreply.github.com>
+ 2014-04-25 16:04:48 -0700
+ Commit: 027f1b8, github.com/apache/spark/pull/186
+
+ SPARK-1607. HOTFIX: Fix syntax adapting Int result to Short
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-25 14:17:38 -0700
+ Commit: df6d814, github.com/apache/spark/pull/556
+
+ Update KafkaWordCount.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-04-25 13:18:49 -0700
+ Commit: 8aaef5c, github.com/apache/spark/pull/523
+
+ Delete the val that is never used
+ WangTao <barneystinson@aliyun.com>
+ 2014-04-25 11:47:01 -0700
+ Commit: 25a276d, github.com/apache/spark/pull/553
+
+ SPARK-1621 Upgrade Chill to 0.3.6
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-25 11:12:41 -0700
+ Commit: a24d918, github.com/apache/spark/pull/543
+
+ SPARK-1619 Launch spark-shell with spark-submit
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-24 23:59:16 -0700
+ Commit: dc3b640, github.com/apache/spark/pull/542
+
+ SPARK-1607. Replace octal literals, removed in Scala 2.11, with hex literals
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-24 23:34:00 -0700
+ Commit: 6e101f1, github.com/apache/spark/pull/529
+
+ Call correct stop().
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-24 23:22:03 -0700
+ Commit: 45ad7f0, github.com/apache/spark/pull/527
+
+ SPARK-1242 Add aggregate to python rdd
+ Holden Karau <holden@pigscanfly.ca>
+ 2014-04-24 23:07:54 -0700
+ Commit: e03bc37, github.com/apache/spark/pull/139
+
+ Fix [SPARK-1078]: Remove the Unnecessary lift-json dependency
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-24 21:51:52 -0700
+ Commit: 095b518, github.com/apache/spark/pull/536
+
+ [Typo] In the maven docs: chd -> cdh
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-24 21:51:17 -0700
+ Commit: 06e82d9, github.com/apache/spark/pull/548
+
+ Generalize pattern for planning hash joins.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-24 21:42:33 -0700
+ Commit: 86ff8b1, github.com/apache/spark/pull/418
+
+ [SPARK-1617] and [SPARK-1618] Improvements to streaming ui and bug fix to socket receiver
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-24 21:34:37 -0700
+ Commit: cd12dd9, github.com/apache/spark/pull/540
+
+ SPARK-1586 Windows build fixes
+ Mridul Muralidharan <mridulm80@apache.org>
+ 2014-04-24 20:48:33 -0700
+ Commit: 968c018, github.com/apache/spark/pull/505
+
+ SPARK-1584: Upgrade Flume dependency to 1.4.0
+ tmalaska <ted.malaska@cloudera.com>
+ 2014-04-24 20:31:17 -0700
+ Commit: d5c6ae6, github.com/apache/spark/pull/507
+
+ [SPARK-986]: Job cancelation for PySpark
+ Ahir Reddy <ahirreddy@gmail.com>
+ 2014-04-24 20:21:10 -0700
+ Commit: e53eb4f, github.com/apache/spark/pull/541
+
+ [SPARK-1615] Synchronize accesses to the LiveListenerBus' event queue
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-24 20:18:15 -0700
+ Commit: ee6f7e2, github.com/apache/spark/pull/544
+
+ [SPARK-1510] Spark Streaming metrics source for metrics system
+ jerryshao <saisai.shao@intel.com>, Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-24 18:56:57 -0700
+ Commit: 80429f3, github.com/apache/spark/pull/545
+
+ Spark 1489 Fix the HistoryServer view acls
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-24 18:38:10 -0700
+ Commit: 44da5ab, github.com/apache/spark/pull/509
+
+ [SQL] Add support for parsing indexing into arrays in SQL.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-24 18:21:00 -0700
+ Commit: 4660991, github.com/apache/spark/pull/518
+
+ [SPARK-1592][streaming] Automatically remove streaming input blocks
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-24 18:18:22 -0700
+ Commit: 526a518, github.com/apache/spark/pull/512
+
+ SPARK-1438 RDD.sample() make seed param optional
+ Arun Ramakrishnan <smartnut007@gmail.com>
+ 2014-04-24 17:27:16 -0700
+ Commit: 35e3d19, github.com/apache/spark/pull/477
+
+ SPARK-1104: kill Process in workerThread of ExecutorRunner
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-04-24 15:55:18 -0700
+ Commit: f99af85, github.com/apache/spark/pull/35
+
+ Fix Scala Style
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-24 15:07:23 -0700
+ Commit: a03ac22, github.com/apache/spark/pull/531
+
+ SPARK-1494 Don't initialize classes loaded by MIMA excludes, attempt 2
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-24 14:54:01 -0700
+ Commit: c5c1916, github.com/apache/spark/pull/526
+
+ Spark 1490 Add kerberos support to the HistoryServer
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-24 11:15:12 -0700
+ Commit: bd37509, github.com/apache/spark/pull/513
+
+ SPARK-1611: Fix incorrect initialization order in AppendOnlyMap
+ zsxwing <zsxwing@gmail.com>
+ 2014-04-24 11:13:40 -0700
+ Commit: 78a49b2, github.com/apache/spark/pull/534
+
+ SPARK-1488. Squash more language feature warnings in new commits by importing implicitConversion
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-24 10:06:18 -0700
+ Commit: 6338a93, github.com/apache/spark/pull/528
+
+ Small changes to release script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-24 09:59:44 -0700
+ Commit: faeb761
+
+ [SPARK-1610] [SQL] Fix Cast to use exact type value when cast from BooleanType to NumericTy...
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-04-24 09:57:28 -0700
+ Commit: 27b2821, github.com/apache/spark/pull/533
+
+ SPARK-1601 & SPARK-1602: two bug fixes related to cancellation
+ Reynold Xin <rxin@apache.org>
+ 2014-04-24 00:27:45 -0700
+ Commit: 1fdf659, github.com/apache/spark/pull/521
+
+ SPARK-1587 Fix thread leak
+ Mridul Muralidharan <mridulm80@apache.org>
+ 2014-04-23 23:20:55 -0700
+ Commit: dd681f5, github.com/apache/spark/pull/504
+
+ [Fix #79] Replace Breakable For Loops By While Loops
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-23 22:47:59 -0700
+ Commit: bb68f47, github.com/apache/spark/pull/503
+
+ SPARK-1589: Fix the incorrect compare
+ zsxwing <zsxwing@gmail.com>
+ 2014-04-23 22:36:02 -0700
+ Commit: 6ab7578, github.com/apache/spark/pull/508
+
+ Mark all fields of EdgePartition, Graph, and GraphOps transient
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-04-23 22:01:13 -0700
+ Commit: 1d6abe3, github.com/apache/spark/pull/520
+
+ Update Java api for setJobGroup with interruptOnCancel
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-23 22:00:22 -0700
+ Commit: d485eec, github.com/apache/spark/pull/522
+
+ [Hot Fix #469] Fix flaky test in SparkListenerSuite
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-23 21:59:33 -0700
+ Commit: 4b2bab1, github.com/apache/spark/pull/516
+
+ [SPARK-1540] Add an optional Ordering parameter to PairRDDFunctions.
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-23 17:03:54 -0700
+ Commit: 640f9a0, github.com/apache/spark/pull/487
+
+ SPARK-1582 Invoke Thread.interrupt() when cancelling jobs
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-23 16:52:49 -0700
+ Commit: 432201c, github.com/apache/spark/pull/498
+
+ Honor default fs name when initializing event logger.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-04-23 14:47:38 -0700
+ Commit: dd1b7a6, github.com/apache/spark/pull/450
+
+ SPARK-1572 Don't kill Executor if PythonRDD fails while computing parent
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-23 14:46:30 -0700
+ Commit: a967b00, github.com/apache/spark/pull/486
+
+ SPARK-1583: Fix a bug that using java.util.HashMap by mistake
+ zsxwing <zsxwing@gmail.com>
+ 2014-04-23 14:12:20 -0700
+ Commit: a664606, github.com/apache/spark/pull/500
+
+ SPARK-1119 and other build improvements
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-23 10:19:32 -0700
+ Commit: cd4ed29, github.com/apache/spark/pull/502
+
+ [SQL] SPARK-1571 Mistake in java example code
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-22 22:19:32 -0700
+ Commit: 39f85e0, github.com/apache/spark/pull/496
+
+ SPARK-1494 Don't initialize classes loaded by MIMA excludes.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-22 21:56:15 -0700
+ Commit: 8e95081, github.com/apache/spark/pull/494
+
+ SPARK-1562 Fix visibility / annotation of Spark SQL APIs
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-22 20:02:33 -0700
+ Commit: aa77f8a, github.com/apache/spark/pull/489
+
+ [FIX: SPARK-1376] use --arg instead of --args in SparkSubmit to avoid warning messages
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-22 19:38:27 -0700
+ Commit: 662c860, github.com/apache/spark/pull/485
+
+ [streaming][SPARK-1578] Removed requirement for TTL in StreamingContext.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-22 19:35:13 -0700
+ Commit: f3d19a9, github.com/apache/spark/pull/491
+
+ [Spark-1538] Fix SparkUI incorrectly hiding persisted RDDs
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-22 19:24:03 -0700
+ Commit: 2de5738, github.com/apache/spark/pull/469
+
+ Assorted clean-up for Spark-on-YARN.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-22 19:22:06 -0700
+ Commit: 995fdc9, github.com/apache/spark/pull/488
+
+ [SPARK-1570] Fix classloading in JavaSQLContext.applySchema
+ Kan Zhang <kzhang@apache.org>
+ 2014-04-22 15:05:12 -0700
+ Commit: ea8cea8, github.com/apache/spark/pull/484
+
+ Fix compilation on Hadoop 2.4.x.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-04-22 14:28:41 -0700
+ Commit: 0ea0b1a, github.com/apache/spark/pull/483
+
+ [Fix #204] Eliminate delay between binding and log checking
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-22 14:27:49 -0700
+ Commit: 745e496, github.com/apache/spark/pull/441
+
+ [SPARK-1506][MLLIB] Documentation improvements for MLlib 1.0
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-22 11:20:47 -0700
+ Commit: 26d35f3, github.com/apache/spark/pull/422
+
+ [SPARK-1281] Improve partitioning in ALS
+ Tor Myklebust <tmyklebu@gmail.com>
+ 2014-04-22 11:07:30 -0700
+ Commit: bf9d49b, github.com/apache/spark/pull/407
+
+ fix bugs of dot in python
+ Xusen Yin <yinxusen@gmail.com>
+ 2014-04-22 11:06:18 -0700
+ Commit: c919798, github.com/apache/spark/pull/463
+
+ [SPARK-1560]: Updated Pyrolite Dependency to be Java 6 compatible
+ Ahir Reddy <ahirreddy@gmail.com>
+ 2014-04-22 09:44:41 -0700
+ Commit: 0f87e6a, github.com/apache/spark/pull/479
+
+ [HOTFIX] SPARK-1399: remove outdated comments
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-04-22 09:43:13 -0700
+ Commit: 87de290, github.com/apache/spark/pull/474
+
+ SPARK-1496: Have jarOfClass return Option[String]
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-22 00:42:16 -0700
+ Commit: 83084d3, github.com/apache/spark/pull/438
+
+ [SPARK-1459] Use local path (and not complete URL) when opening local lo...
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-04-21 23:10:53 -0700
+ Commit: ac164b7, github.com/apache/spark/pull/375
+
+ [Fix #274] Document + fix annotation usages
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-21 22:24:44 -0700
+ Commit: b3e5366, github.com/apache/spark/pull/470
+
+ [SPARK-1439, SPARK-1440] Generate unified Scaladoc across projects and Javadocs
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-21 21:57:40 -0700
+ Commit: fc78384, github.com/apache/spark/pull/457
+
+ [SPARK-1332] Improve Spark Streaming's Network Receiver and InputDStream API [WIP]
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-21 19:04:49 -0700
+ Commit: 04c37b6, github.com/apache/spark/pull/300
+
+ Dev script: include RC name in git tag
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-21 14:21:17 -0700
+ Commit: 5a5b334
+
+ SPARK-1399: show stage failure reason in UI
+ CodingCat <zhunansjtu@gmail.com>, Nan Zhu <CodingCat@users.noreply.github.com>
+ 2014-04-21 14:10:23 -0700
+ Commit: 43e4a29, github.com/apache/spark/pull/421
+
+ SPARK-1539: RDDPage.scala contains RddPage class
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-21 12:48:02 -0700
+ Commit: b7df31e, github.com/apache/spark/pull/454
+
+ [Hot Fix] Ignore org.apache.spark.ui.UISuite tests
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-21 12:37:43 -0700
+ Commit: af46f1f, github.com/apache/spark/pull/466
+
+ Clean up and simplify Spark configuration
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-21 10:26:33 -0700
+ Commit: fb98488, github.com/apache/spark/pull/299
+
+ REPL cleanup.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-19 17:32:24 -0700
+ Commit: 3a390bf, github.com/apache/spark/pull/451
+
+ [SPARK-1535] ALS: Avoid the garbage-creating ctor of DoubleMatrix
+ Tor Myklebust <tmyklebu@gmail.com>
+ 2014-04-19 15:10:18 -0700
+ Commit: 25fc318, github.com/apache/spark/pull/442
+
+ Add insertInto and saveAsTable to Python API.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-19 15:08:54 -0700
+ Commit: 10d0421, github.com/apache/spark/pull/447
+
+ Use scala deprecation instead of java.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-19 15:06:04 -0700
+ Commit: 5d0f58b, github.com/apache/spark/pull/452
+
+ README update
+ Reynold Xin <rxin@apache.org>
+ 2014-04-18 22:34:39 -0700
+ Commit: 28238c8, github.com/apache/spark/pull/443
+
+ SPARK-1482: Fix potential resource leaks in saveAsHadoopDataset and save...
+ zsxwing <zsxwing@gmail.com>
+ 2014-04-18 17:49:22 -0700
+ Commit: 2089e0e, github.com/apache/spark/pull/400
+
+ SPARK-1456 Remove view bounds on Ordered in favor of a context bound on Ordering.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-18 12:04:13 -0700
+ Commit: c399baa, github.com/apache/spark/pull/410
+
+ Fixed broken pyspark shell.
+ Reynold Xin <rxin@apache.org>
+ 2014-04-18 10:10:13 -0700
+ Commit: 81a152c, github.com/apache/spark/pull/444
+
+ SPARK-1523: improve the readability of code in AkkaUtil
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-04-18 10:05:00 -0700
+ Commit: 3c7a9ba, github.com/apache/spark/pull/434
+
+ SPARK-1357 (addendum). More Experimental items in MLlib
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-18 10:04:02 -0700
+ Commit: 8aa1f4c, github.com/apache/spark/pull/372
+
+ [SPARK-1520] remove fastutil from dependencies
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-18 10:03:15 -0700
+ Commit: aa17f02, github.com/apache/spark/pull/437
+
+ Reuses Row object in ExistingRdd.productToRowRdd()
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-04-18 10:02:27 -0700
+ Commit: 89f4743, github.com/apache/spark/pull/432
+
+ SPARK-1483: Rename minSplits to minPartitions in public APIs
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-04-18 10:01:16 -0700
+ Commit: e31c8ff, github.com/apache/spark/pull/430
+
+ HOTFIX: Ignore streaming UI test
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-17 17:33:24 -0700
+ Commit: 7863ecc, github.com/apache/spark/pull/440
+
+ FIX: Don't build Hive in assembly unless running Hive tests.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-17 17:24:00 -0700
+ Commit: 6c746ba, github.com/apache/spark/pull/439
+
+ SPARK-1408 Modify Spark on Yarn to point to the history server when app ...
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-17 16:36:37 -0500
+ Commit: 0058b5d, github.com/apache/spark/pull/362
+
+ [SPARK-1395] Allow "local:" URIs to work on Yarn.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-04-17 10:29:38 -0500
+ Commit: 6904750, github.com/apache/spark/pull/303
+
+ [python alternative] pyspark require Python2, failing if system default is Py3 from shell.py
+ AbhishekKr <abhikumar163@gmail.com>
+ 2014-04-16 19:05:40 -0700
+ Commit: bb76eae, github.com/apache/spark/pull/399
+
+ SPARK-1462: Examples of ML algorithms are using deprecated APIs
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-16 18:23:07 -0700
+ Commit: 6ad4c54, github.com/apache/spark/pull/416
+
+ Include stack trace for exceptions thrown by user code.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-16 18:12:56 -0700
+ Commit: d4916a8, github.com/apache/spark/pull/409
+
+ Update ReducedWindowedDStream.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-04-16 18:08:11 -0700
+ Commit: 07b7ad3, github.com/apache/spark/pull/425
+
+ misleading task number of groupByKey
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-04-16 17:58:42 -0700
+ Commit: 9c40b9e, github.com/apache/spark/pull/403
+
+ Fixing a race condition in event listener unit test
+ Kan Zhang <kzhang@apache.org>
+ 2014-04-16 17:39:11 -0700
+ Commit: 38877cc, github.com/apache/spark/pull/401
+
+ remove unnecessary brace and semicolon in 'putBlockInfo.synchronize' block
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-04-16 17:30:01 -0700
+ Commit: 016a877, github.com/apache/spark/pull/411
+
+ SPARK-1329: Create pid2vid with correct number of partitions
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-04-16 17:16:55 -0700
+ Commit: 17d3234, github.com/apache/spark/pull/368
+
+ Rebuild routing table after Graph.reverse
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-04-16 17:15:50 -0700
+ Commit: 235a47c, github.com/apache/spark/pull/431
+
+ Add clean to build
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-16 16:32:34 -0700
+ Commit: 987760e
+
+ [SPARK-1511] use Files.move instead of renameTo in TestUtils.scala
+ Ye Xianjin <advancedxy@gmail.com>
+ 2014-04-16 14:56:22 -0700
+ Commit: 10b1c59, github.com/apache/spark/pull/427
+
+ SPARK-1465: Spark compilation is broken with the latest hadoop-2.4.0 release
+ xuan <xuan@MacBook-Pro.local>, xuan <xuan@macbook-pro.home>
+ 2014-04-16 14:41:22 -0500
+ Commit: 725925c, github.com/apache/spark/pull/396
+
+ SPARK-1469: Scheduler mode should accept lower-case definitions and have...
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-16 09:58:57 -0700
+ Commit: e269c24, github.com/apache/spark/pull/388
+
+ Minor addition to SPARK-1497
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-16 09:43:17 -0700
+ Commit: 82349fb
+
+ SPARK-1497. Fix scalastyle warnings in YARN, Hive code
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-16 09:34:59 -0700
+ Commit: 77f8367, github.com/apache/spark/pull/413
+
+ SPARK-1310: Start adding k-fold cross validation to MLLib [adds kFold to MLUtils & fixes bug in BernoulliSampler]
+ Holden Karau <holden@pigscanfly.ca>
+ 2014-04-16 09:33:27 -0700
+ Commit: c3527a3, github.com/apache/spark/pull/18
+
+ update spark.default.parallelism
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-04-16 09:14:18 -0700
+ Commit: 9edd887, github.com/apache/spark/pull/389
+
+ Loads test tables when running "sbt hive/console" without HIVE_DEV_HOME
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-04-16 08:54:34 -0700
+ Commit: fec462c, github.com/apache/spark/pull/417
+
+ Make "spark logo" link refer to "/".
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-04-16 08:53:01 -0700
+ Commit: c0273d8, github.com/apache/spark/pull/408
+
+ [SPARK-959] Updated SBT from 0.13.1 to 0.13.2
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-04-16 08:52:14 -0700
+ Commit: 6a10d80, github.com/apache/spark/pull/426
+
+ [SQL] SPARK-1424 Generalize insertIntoTable functions on SchemaRDDs
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-15 20:40:40 -0700
+ Commit: 273c2fd, github.com/apache/spark/pull/354
+
+ [WIP] SPARK-1430: Support sparse data in Python MLlib
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-15 20:33:24 -0700
+ Commit: 63ca581, github.com/apache/spark/pull/341
+
+ [FIX] update sbt-idea to version 1.6.0
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-15 19:37:32 -0700
+ Commit: 8517911, github.com/apache/spark/pull/419
+
+ SPARK-1455: Better isolation for unit tests.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-15 19:34:39 -0700
+ Commit: 5aaf983, github.com/apache/spark/pull/420
+
+ Decision Tree documentation for MLlib programming guide
+ Manish Amde <manish9ue@gmail.com>
+ 2014-04-15 11:14:28 -0700
+ Commit: 07d72fe, github.com/apache/spark/pull/402
+
+ [SPARK-1157][MLlib] L-BFGS Optimizer based on Breeze's implementation.
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-04-15 11:12:47 -0700
+ Commit: 6843d63, github.com/apache/spark/pull/353
+
+ SPARK-1501: Ensure assertions in Graph.apply are asserted.
+ William Benton <willb@redhat.com>
+ 2014-04-15 10:38:42 -0700
+ Commit: 2580a3b, github.com/apache/spark/pull/415
+
+ SPARK-1426: Make MLlib work with NumPy versions older than 1.7
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-15 00:19:43 -0700
+ Commit: df36091, github.com/apache/spark/pull/391
+
+ SPARK-1374: PySpark API for SparkSQL
+ Ahir Reddy <ahirreddy@gmail.com>, Michael Armbrust <michael@databricks.com>
+ 2014-04-15 00:07:55 -0700
+ Commit: c99bcb7f, github.com/apache/spark/pull/363
+
+ SPARK-1488. Resolve scalac feature warnings during build
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-14 19:50:00 -0700
+ Commit: 0247b5c, github.com/apache/spark/pull/404
+
+ HOTFIX: Use file name and not paths for excludes
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-14 15:51:54 -0700
+ Commit: 268b535
+
+ [BUGFIX] In-memory columnar storage bug fixes
+ Cheng Lian <lian.cs.zju@gmail.com>, Michael Armbrust <michael@databricks.com>
+ 2014-04-14 15:22:43 -0700
+ Commit: 7dbca68, github.com/apache/spark/pull/374
+
+ [SPARK-1415] Hadoop min split for wholeTextFiles()
+ Xusen Yin <yinxusen@gmail.com>
+ 2014-04-13 13:18:52 -0700
+ Commit: 037fe4d, github.com/apache/spark/pull/376
+
+ SPARK-1480: Clean up use of classloaders
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-13 08:58:37 -0700
+ Commit: 4bc07ee, github.com/apache/spark/pull/398
+
+ [SPARK-1403] Move the class loader creation back to where it was in 0.9.0
+ Bharath Bhushan <manku.timma@outlook.com>
+ 2014-04-12 20:52:29 -0700
+ Commit: ca11919, github.com/apache/spark/pull/322
+
+ [Fix #204] Update out-dated comments
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-12 16:33:38 -0700
+ Commit: c2d160f, github.com/apache/spark/pull/381
+
+ [SPARK-1386] Web UI for Spark Streaming
+ Tathagata Das <tathagata.das1565@gmail.com>, Andrew Or <andrewor14@gmail.com>
+ 2014-04-11 23:33:49 -0700
+ Commit: 6aa08c3, github.com/apache/spark/pull/290
+
+ SPARK-1057 (alternative) Remove fastutil
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-11 22:46:47 -0700
+ Commit: 165e06a, github.com/apache/spark/pull/266
+
+ Update WindowedDStream.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-04-11 20:33:42 -0700
+ Commit: aa8bb11, github.com/apache/spark/pull/390
+
+ [WIP] [SPARK-1328] Add vector statistics
+ Xusen Yin <yinxusen@gmail.com>, Xiangrui Meng <meng@databricks.com>
+ 2014-04-11 19:43:22 -0700
+ Commit: fdfb45e, github.com/apache/spark/pull/268
+
+ [FIX] make coalesce test deterministic in RDDSuite
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-11 19:41:40 -0700
+ Commit: 7038b00, github.com/apache/spark/pull/387
+
+ HOTFIX: Ignore python metastore files in RAT checks.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-11 13:23:21 -0700
+ Commit: 6a0f8e3, github.com/apache/spark/pull/393
+
+ [SPARK-1225, 1241] [MLLIB] Add AreaUnderCurve and BinaryClassificationMetrics
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-11 12:06:13 -0700
+ Commit: f5ace8d, github.com/apache/spark/pull/364
+
+ Some clean up in build/docs
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-11 10:45:27 -0700
+ Commit: 98225a6, github.com/apache/spark/pull/382
+
+ SPARK-1417: Spark on Yarn - spark UI link from resourcemanager is broken
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-11 13:17:48 +0530
+ Commit: 446bb34, github.com/apache/spark/pull/344
+
+ SPARK-1202: Improvements to task killing in the UI.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-10 20:43:56 -0700
+ Commit: 44f654e, github.com/apache/spark/pull/386
+
+ Add Spark v0.9.1 to ec2 launch script and use it as the default
+ Harvey Feng <hyfeng224@gmail.com>
+ 2014-04-10 18:25:54 -0700
+ Commit: 7b4203a, github.com/apache/spark/pull/385
+
+ Set spark.executor.uri from environment variable (needed by Mesos)
+ Ivan Wick <ivanwick+github@gmail.com>
+ 2014-04-10 17:49:30 -0700
+ Commit: 5cd11d5, github.com/apache/spark/pull/311
+
+ SPARK-1202 - Add a "cancel" button in the UI for stages
+ Sundeep Narravula <sundeepn@superduel.local>, Sundeep Narravula <sundeepn@dhcpx-204-110.corp.yahoo.com>
+ 2014-04-10 17:10:11 -0700
+ Commit: 2c55783, github.com/apache/spark/pull/246
+
+ [SQL] Improve column pruning in the optimizer.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-10 16:20:33 -0700
+ Commit: f99401a, github.com/apache/spark/pull/378
+
+ Remove Unnecessary Whitespace's
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-10 15:04:13 -0700
+ Commit: 930b70f, github.com/apache/spark/pull/380
+
+ Update tuning.md
+ Andrew Ash <andrew@andrewash.com>
+ 2014-04-10 14:59:58 -0700
+ Commit: f046662, github.com/apache/spark/pull/384
+
+ Revert "SPARK-1433: Upgrade Mesos dependency to 0.17.0"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-10 14:43:29 -0700
+ Commit: 7b52b66
+
+ SPARK-1428: MLlib should convert non-float64 NumPy arrays to float64 instead of complaining
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-10 11:17:41 -0700
+ Commit: 3bd3129, github.com/apache/spark/pull/356
+
+ [SPARK-1276] Add a HistoryServer to render persisted UI
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-10 10:39:34 -0700
+ Commit: 79820fe, github.com/apache/spark/pull/204
+
+
+Release 1.0.0
+
+ HOTFIX: Add no-arg SparkContext constructor in Java
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-25 20:13:32 -0700
+ Commit: 18c77cb, github.com/apache/spark/pull/878
+
+ [SQL] Minor: Introduce SchemaRDD#aggregate() for simple aggregations
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-25 18:37:44 -0700
+ Commit: a3976a2, github.com/apache/spark/pull/874
+
+ SPARK-1903 Document Spark's network connections
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-25 17:15:47 -0700
+ Commit: 5107a6f, github.com/apache/spark/pull/856
+
+ Fix PEP8 violations in Python mllib.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 17:15:01 -0700
+ Commit: 07f34ca, github.com/apache/spark/pull/871
+
+ Python docstring update for sql.py.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 16:04:17 -0700
+ Commit: 8891495, github.com/apache/spark/pull/869
+
+ Fix PEP8 violations in examples/src/main/python.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 14:48:27 -0700
+ Commit: 3368397, github.com/apache/spark/pull/870
+
+ Added license header for tox.ini.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 01:47:08 -0700
+ Commit: 7273bfc
+
+ SPARK-1822: Some minor cleanup work on SchemaRDD.count()
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 01:44:49 -0700
+ Commit: aeffc20, github.com/apache/spark/pull/868
+
+ Added PEP8 style configuration file.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-25 01:32:15 -0700
+ Commit: 291567d, github.com/apache/spark/pull/872
+
+ [SPARK-1822] SchemaRDD.count() should use query optimizer
+ Kan Zhang <kzhang@apache.org>
+ 2014-05-25 00:06:42 -0700
+ Commit: 64d0fb5, github.com/apache/spark/pull/841
+
+ spark-submit: add exec at the end of the script
+ Colin Patrick Mccabe <cmccabe@cloudera.com>
+ 2014-05-24 22:39:27 -0700
+ Commit: 7e59335, github.com/apache/spark/pull/858
+
+ [SPARK-1886] check executor id existence when executor exit
+ Zhen Peng <zhenpeng01@baidu.com>
+ 2014-05-24 20:40:19 -0700
+ Commit: b5e9686, github.com/apache/spark/pull/827
+
+ Updated CHANGES.txt
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-25 02:20:13 +0000
+ Commit: 8406092
+
+ SPARK-1911: Emphasize that Spark jars should be built with Java 6.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-24 18:27:00 -0700
+ Commit: 217bd56, github.com/apache/spark/pull/859
+
+ [SPARK-1900 / 1918] PySpark on YARN is broken
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-24 18:01:49 -0700
+ Commit: 12f5ecc, github.com/apache/spark/pull/853
+
+ Update LBFGSSuite.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-05-23 13:02:40 -0700
+ Commit: 9be103a, github.com/apache/spark/pull/815
+
+ Updated scripts for auditing releases
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-22 20:48:55 -0700
+ Commit: 6541ca2, github.com/apache/spark/pull/844
+
+ [SPARK-1896] Respect spark.master (and --master) before MASTER in spark-shell
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-22 20:32:27 -0700
+ Commit: c3b4065, github.com/apache/spark/pull/846
+
+ [SPARK-1897] Respect spark.jars (and --jars) in spark-shell
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-22 20:25:41 -0700
+ Commit: 23cc40e, github.com/apache/spark/pull/849
+
+ Fix UISuite unit test that fails under Jenkins contention
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-22 15:11:05 -0700
+ Commit: a566216, github.com/apache/spark/pull/857
+
+ [SPARK-1870] Make spark-submit --jars work in yarn-cluster mode.
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-22 01:52:50 -0700
+ Commit: 79cd26c, github.com/apache/spark/pull/848
+
+ Configuration documentation updates
+ Reynold Xin <rxin@apache.org>
+ 2014-05-21 18:49:12 -0700
+ Commit: 75af8bd, github.com/apache/spark/pull/851
+
+ [SPARK-1889] [SQL] Apply splitConjunctivePredicates to join condition while finding join ke...
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-21 15:37:47 -0700
+ Commit: 6e7934e, github.com/apache/spark/pull/836
+
+ [SPARK-1519] Support minPartitions param of wholeTextFiles() in PySpark
+ Kan Zhang <kzhang@apache.org>
+ 2014-05-21 13:26:53 -0700
+ Commit: 30d1df5, github.com/apache/spark/pull/697
+
+ [Typo] Stoped -> Stopped
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-21 11:59:05 -0700
+ Commit: 9b8f772, github.com/apache/spark/pull/847
+
+ [Minor] Move JdbcRDDSuite to the correct package
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-21 01:25:10 -0700
+ Commit: bc6bbfa, github.com/apache/spark/pull/839
+
+ [Docs] Correct example of creating a new SparkConf
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-21 01:23:34 -0700
+ Commit: 7295dd9, github.com/apache/spark/pull/842
+
+ [SPARK-1250] Fixed misleading comments in bin/pyspark, bin/spark-class
+ Sumedh Mungee <smungee@gmail.com>
+ 2014-05-21 01:22:25 -0700
+ Commit: 364c14a, github.com/apache/spark/pull/843
+
+ [Hotfix] Blacklisted flaky HiveCompatibility test
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-20 10:27:12 -0700
+ Commit: b4d93d3, github.com/apache/spark/pull/838
+
+ Updated CHANGES.txt
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-19 23:12:24 -0700
+ Commit: 1c00f2a
+
+ [Spark 1877] ClassNotFoundException when loading RDD with serialized objects
+ Tathagata Das <tathagata.das1565@gmail.com>, Ghidireac <bogdang@u448a5b0a73d45358d94a.ant.amazon.com>
+ 2014-05-19 22:36:24 -0700
+ Commit: 6cbe2a3, github.com/apache/spark/pull/835
+
+ [SPARK-1874][MLLIB] Clean up MLlib sample data
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-19 21:29:33 -0700
+ Commit: 1c6c8b5, github.com/apache/spark/pull/833
+
+ SPARK-1689: Spark application should die when removed by Master
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-19 20:55:26 -0700
+ Commit: 78b6e6f, github.com/apache/spark/pull/832
+
+ [SPARK-1875]NoClassDefFoundError: StringUtils when building with hadoop 1.x and hive
+ witgo <witgo@qq.com>
+ 2014-05-19 19:40:29 -0700
+ Commit: 875c54f, github.com/apache/spark/pull/824
+
+ SPARK-1879. Increase MaxPermSize since some of our builds have many classes
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-19 18:42:28 -0700
+ Commit: 00563e1, github.com/apache/spark/pull/823
+
+ SPARK-1878: Fix the incorrect initialization order
+ zsxwing <zsxwing@gmail.com>
+ 2014-05-19 16:41:31 -0700
+ Commit: 901102c, github.com/apache/spark/pull/822
+
+ [SPARK-1876] Windows fixes to deal with latest distribution layout changes
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-19 15:02:35 -0700
+ Commit: 111c121, github.com/apache/spark/pull/819
+
+ [WIP][SPARK-1871][MLLIB] Improve MLlib guide for v1.0
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-18 17:00:57 -0700
+ Commit: ecab8a2, github.com/apache/spark/pull/816
+
+ SPARK-1873: Add README.md file when making distributions
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-18 16:51:53 -0700
+ Commit: 8e8b351, github.com/apache/spark/pull/818
+
+ Fix spark-submit path in spark-shell & pyspark
+ Neville Li <neville@spotify.com>
+ 2014-05-18 13:31:23 -0700
+ Commit: e06e4b0, github.com/apache/spark/pull/812
+
+ Make deprecation warning less severe
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-16 22:58:47 -0700
+ Commit: 3b3d7c8, github.com/apache/spark/pull/810
+
+ [SPARK-1824] Remove <master> from Python examples
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-16 22:36:23 -0700
+ Commit: 03b4242, github.com/apache/spark/pull/802
+
+ [SPARK-1808] Route bin/pyspark through Spark submit
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-16 22:34:38 -0700
+ Commit: 318739a, github.com/apache/spark/pull/799
+
+ Version bump of spark-ec2 scripts
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-16 21:42:14 -0700
+ Commit: 9cd12f3, github.com/apache/spark/pull/809
+
+ SPARK-1864 Look in spark conf instead of system properties when propagating configuration to executors.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-16 20:25:10 -0700
+ Commit: a16a19f, github.com/apache/spark/pull/808
+
+ Tweaks to Mesos docs
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-16 17:35:05 -0700
+ Commit: 2ba6711, github.com/apache/spark/pull/806
+
+ [SQL] Implement between in hql
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-16 11:47:00 -0700
+ Commit: 386b31c, github.com/apache/spark/pull/804
+
+ bugfix: overflow of graphx Edge compare function
+ Zhen Peng <zhenpeng01@baidu.com>
+ 2014-05-16 11:37:18 -0700
+ Commit: ff47cdc, github.com/apache/spark/pull/769
+
+ SPARK-1862: Support for MapR in the Maven build.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-15 23:31:43 -0700
+ Commit: eec4dd8, github.com/apache/spark/pull/803
+
+ [Spark-1461] Deferred Expression Evaluation (short-circuit evaluation)
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-05-15 22:12:34 -0700
+ Commit: eac4ee8, github.com/apache/spark/pull/446
+
+ SPARK-1860: Do not cleanup application work/ directories by default
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-15 21:37:58 -0700
+ Commit: 5441471, github.com/apache/spark/pull/800
+
+ Typos in Spark
+ Huajian Mao <huajianmao@gmail.com>
+ 2014-05-15 18:20:16 -0700
+ Commit: a2742d8, github.com/apache/spark/pull/798
+
+ Fixes a misplaced comment.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-05-15 16:58:37 -0700
+ Commit: 2e418f5, github.com/apache/spark/pull/788
+
+ [SQL] Fix tiny/small ints from HiveMetastore.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-15 16:50:42 -0700
+ Commit: ffa9c49, github.com/apache/spark/pull/797
+
+ SPARK-1803 Replaced colon in filenames with a dash
+ Stevo Slavić <sslavic@gmail.com>, Stevo Slavic <sslavic@gmail.com>
+ 2014-05-15 16:44:14 -0700
+ Commit: 22f261a, github.com/apache/spark/pull/739
+
+ SPARK-1851. Upgrade Avro dependency to 1.7.6 so Spark can read Avro file...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-05-15 16:35:39 -0700
+ Commit: 3587057, github.com/apache/spark/pull/795
+
+ [SPARK-1741][MLLIB] add predict(JavaRDD) to RegressionModel, ClassificationModel, and KMeans
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-15 11:59:59 -0700
+ Commit: bc9a96e, github.com/apache/spark/pull/670
+
+ [SPARK-1819] [SQL] Fix GetField.nullable.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-15 11:21:33 -0700
+ Commit: f9eeddc, github.com/apache/spark/pull/757
+
+ [SPARK-1845] [SQL] Use AllScalaRegistrar for SparkSqlSerializer to register serializers of ...
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-15 11:20:21 -0700
+ Commit: 7515367, github.com/apache/spark/pull/790
+
+ SPARK-1846 Ignore logs directory in RAT checks
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-15 11:05:39 -0700
+ Commit: aa5f989, github.com/apache/spark/pull/793
+
+ HOTFIX: Don't build Javadoc in Maven when creating releases.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 23:48:03 -0700
+ Commit: 88f1da3
+
+ fix different versions of commons-lang dependency and apache/spark#746 addendum
+ witgo <witgo@qq.com>
+ 2014-05-14 22:26:26 -0700
+ Commit: 31b853c, github.com/apache/spark/pull/754
+
+ Package docs
+ Prashant Sharma <prashant.s@imaginea.com>, Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 22:24:41 -0700
+ Commit: c02d614, github.com/apache/spark/pull/785
+
+ Documentation: Encourage use of reduceByKey instead of groupByKey.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 22:24:04 -0700
+ Commit: f2faa37, github.com/apache/spark/pull/784
+
+ Add language tabs and Python version to interactive part of quick-start
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-14 21:45:20 -0700
+ Commit: 976784b, github.com/apache/spark/pull/782
+
+ [SPARK-1840] SparkListenerBus prints out scary error message when terminated normally
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-14 21:13:41 -0700
+ Commit: ba87123, github.com/apache/spark/pull/783
+
+ default task number misleading in several places
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-05-14 18:20:20 -0700
+ Commit: 9f0f2ec, github.com/apache/spark/pull/766
+
+ [SPARK-1826] fix the head notation of package object dsl
+ wangfei <scnbwf@yeah.net>
+ 2014-05-14 17:59:11 -0700
+ Commit: fdf9717, github.com/apache/spark/pull/765
+
+ [Typo] propertes -> properties
+ andrewor14 <andrewor14@gmail.com>
+ 2014-05-14 17:54:53 -0700
+ Commit: 5ca3096, github.com/apache/spark/pull/780
+
+ [SPARK-1696][MLLIB] use alpha in dense dspr
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-14 17:18:30 -0700
+ Commit: d6f1a75, github.com/apache/spark/pull/778
+
+ [FIX] do not load defaults when testing SparkConf in pyspark
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-14 14:57:17 -0700
+ Commit: 31faec7, github.com/apache/spark/pull/775
+
+ SPARK-1833 - Have an empty SparkContext constructor.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 12:53:30 -0700
+ Commit: 8e13ab2, github.com/apache/spark/pull/774
+
+ SPARK-1829 Sub-second durations shouldn't round to "0 s"
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-14 12:01:14 -0700
+ Commit: 530bdf7, github.com/apache/spark/pull/768
+
+ Fix: sbt test throw an java.lang.OutOfMemoryError: PermGen space
+ witgo <witgo@qq.com>
+ 2014-05-14 11:19:26 -0700
+ Commit: 379f733, github.com/apache/spark/pull/773
+
+ Adding back hive support
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 10:21:27 -0700
+ Commit: e8ca397
+
+ [SPARK-1620] Handle uncaught exceptions in function run by Akka scheduler
+ Mark Hamstra <markhamstra@gmail.com>
+ 2014-05-14 10:07:25 -0700
+ Commit: 9ff9078, github.com/apache/spark/pull/622
+
+ SPARK-1828: Created forked version of hive-exec that doesn't bundle other dependencies
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-14 09:51:01 -0700
+ Commit: 34f6fa9, github.com/apache/spark/pull/767
+
+ SPARK-1818 Freshen Mesos documentation
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-14 09:45:33 -0700
+ Commit: fc6b652, github.com/apache/spark/pull/756
+
+ SPARK-1827. LICENSE and NOTICE files need a refresh to contain transitive dependency info
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-14 09:38:33 -0700
+ Commit: 7083282, github.com/apache/spark/pull/770
+
+ Fixed streaming examples docs to use run-example instead of spark-submit
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-14 04:17:32 -0700
+ Commit: c7571d8, github.com/apache/spark/pull/722
+
+ [SPARK-1769] Executor loss causes NPE race condition
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-14 00:54:33 -0700
+ Commit: 69ec314, github.com/apache/spark/pull/762
+
+ Fix dep exclusion: avro-ipc, not avro, depends on netty.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-05-14 00:37:57 -0700
+ Commit: b3d9878, github.com/apache/spark/pull/763
+
+ SPARK-1801. expose InterruptibleIterator and TaskKilledException in deve...
+ Koert Kuipers <koert@tresata.com>
+ 2014-05-14 00:10:12 -0700
+ Commit: 7da80a3, github.com/apache/spark/pull/764
+
+ [SQL] Improve column pruning.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-13 23:27:22 -0700
+ Commit: f66f766, github.com/apache/spark/pull/729
+
+ Revert "[SPARK-1784] Add a new partitioner to allow specifying # of keys per partition"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-13 23:25:19 -0700
+ Commit: 721194b
+
+ Implement ApproximateCountDistinct for SparkSql
+ larvaboy <larvaboy@gmail.com>
+ 2014-05-13 21:26:08 -0700
+ Commit: 92b0ec9, github.com/apache/spark/pull/737
+
+ [SPARK-1784] Add a new partitioner to allow specifying # of keys per partition
+ Syed Hashmi <shashmi@cloudera.com>
+ 2014-05-13 21:24:23 -0700
+ Commit: 66fe479, github.com/apache/spark/pull/721
+
+ [SQL] Make it possible to create Java/Python SQLContexts from an existing Scala SQLContext.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-13 21:23:51 -0700
+ Commit: 618b3e6, github.com/apache/spark/pull/761
+
+ [SPARK-1527] change rootDir*.getName to rootDir*.getAbsolutePath
+ Ye Xianjin <advancedxy@gmail.com>
+ 2014-05-13 19:03:51 -0700
+ Commit: ef5e9d7, github.com/apache/spark/pull/436
+
+ [SPARK-1816] LiveListenerBus dies if a listener throws an exception
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-13 18:32:32 -0700
+ Commit: 3892ec5, github.com/apache/spark/pull/759
+
+ SPARK-1791 - SVM implementation does not use threshold parameter
+ Andrew Tulloch <andrew@tullo.ch>
+ 2014-05-13 17:31:27 -0700
+ Commit: d6994f4, github.com/apache/spark/pull/725
+
+ BUILD: Add more content to make-distribution.sh.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 23:02:54 -0700
+ Commit: 716462c
+
+ Adding CHANGES.txt file and removing YARN support for now
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 20:21:23 -0700
+ Commit: fa2d4d8
+
+ SPARK-1815. SparkContext should not be marked DeveloperApi
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-05-12 20:08:30 -0700
+ Commit: 31d54c0, github.com/apache/spark/pull/753
+
+ [SPARK-1753 / 1773 / 1814] Update outdated docs for spark-submit, YARN, standalone etc.
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-12 19:44:14 -0700
+ Commit: b9e41f4, github.com/apache/spark/pull/701
+
+ [SPARK-1780] Non-existent SPARK_DAEMON_OPTS is lurking around
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-12 19:42:35 -0700
+ Commit: 5ef24a0, github.com/apache/spark/pull/751
+
+ SPARK-1757 Failing test for saving null primitives with .saveAsParquetFile()
+ Andrew Ash <andrew@andrewash.com>, Michael Armbrust <michael@databricks.com>
+ 2014-05-12 19:23:39 -0700
+ Commit: b52ac0e, github.com/apache/spark/pull/690
+
+ Modify a typo in monitoring.md
+ Kousuke Saruta <sarutak@oss.nttdata.co.jp>
+ 2014-05-12 19:21:06 -0700
+ Commit: 89b56d7, github.com/apache/spark/pull/698
+
+ L-BFGS Documentation
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-05-12 19:20:24 -0700
+ Commit: bad4c9d, github.com/apache/spark/pull/702
+
+ Typo: resond -> respond
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-12 18:46:28 -0700
+ Commit: 1fbebca, github.com/apache/spark/pull/743
+
+ [SQL] Make Hive Metastore conversion functions publicly visible.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-12 18:40:30 -0700
+ Commit: 24cc933, github.com/apache/spark/pull/750
+
+ [SPARK-1736] Spark submit for Windows
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-12 17:39:40 -0700
+ Commit: 59695b3, github.com/apache/spark/pull/745
+
+ SPARK-1802. (Addendium) Audit dependency graph when Spark is built with -Pyarn
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-12 17:35:29 -0700
+ Commit: 02caa7e, github.com/apache/spark/pull/746
+
+ SPARK-1623: Use File objects instead of String's in HTTPBroadcast
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 17:27:28 -0700
+ Commit: c294f37, github.com/apache/spark/pull/749
+
+ Rename testExecutorEnvs --> executorEnvs.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 17:09:13 -0700
+ Commit: e9d602d, github.com/apache/spark/pull/747
+
+ Adding hadoop-2.2 profile to the build
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 15:40:48 -0700
+ Commit: b66051e
+
+ Rollback versions for 1.0.0-rc4
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 15:23:53 -0700
+ Commit: 51142b7
+
+ SPARK-1802. Audit dependency graph when Spark is built with -Phive
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-12 14:17:25 -0700
+ Commit: e185281, github.com/apache/spark/pull/744
+
+ SPARK-1798. Tests should clean up temp files
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-12 14:16:19 -0700
+ Commit: 14515b4, github.com/apache/spark/pull/732
+
+ BUILD: Include Hive with default packages when creating a release
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 13:20:23 -0700
+ Commit: 722ecaa
+
+ SPARK-1786: Reopening PR 724
+ Ankur Dave <ankurdave@gmail.com>, Joseph E. Gonzalez <joseph.e.gonzalez@gmail.com>
+ 2014-05-12 13:05:24 -0700
+ Commit: 642ad49, github.com/apache/spark/pull/742
+
+ SPARK-1806: Upgrade Mesos dependency to 0.18.1
+ Bernardo Gomez Palacio <bernardo.gomezpalacio@gmail.com>
+ 2014-05-12 11:10:28 -0700
+ Commit: 0be8b45, github.com/apache/spark/pull/741
+
+ SPARK-1772 Stop catching Throwable, let Executors die
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-12 11:08:52 -0700
+ Commit: c88adbb, github.com/apache/spark/pull/715
+
+ Revert "SPARK-1786: Edge Partition Serialization"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-12 10:51:01 -0700
+ Commit: 19ccf20
+
+ SPARK-1786: Edge Partition Serialization
+ Ankur Dave <ankurdave@gmail.com>, Joseph E. Gonzalez <joseph.e.gonzalez@gmail.com>
+ 2014-05-11 19:20:42 -0700
+ Commit: 09e7aa4, github.com/apache/spark/pull/724
+
+ Fix error in 2d Graph Partitioner
+ Joseph E. Gonzalez <joseph.e.gonzalez@gmail.com>
+ 2014-05-11 18:33:46 -0700
+ Commit: f84b798, github.com/apache/spark/pull/709
+
+ SPARK-1652: Set driver memory correctly in spark-submit.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-11 18:17:34 -0700
+ Commit: 2eea663, github.com/apache/spark/pull/730
+
+ SPARK-1770: Load balance elements when repartitioning.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-11 17:11:55 -0700
+ Commit: 5d69699, github.com/apache/spark/pull/727
+
+ remove outdated runtime Information scala home
+ witgo <witgo@qq.com>
+ 2014-05-11 14:34:27 -0700
+ Commit: 8097bb2, github.com/apache/spark/pull/728
+
+ Revert "Enabled incremental build that comes with sbt 0.13.2"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-10 21:08:53 -0700
+ Commit: 758e543
+
+ Enabled incremental build that comes with sbt 0.13.2
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-05-10 21:08:04 -0700
+ Commit: 71ce7eb, github.com/apache/spark/pull/525
+
+ [SPARK-1774] Respect SparkSubmit --jars on YARN (client)
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-10 20:58:02 -0700
+ Commit: 012f904, github.com/apache/spark/pull/710
+
+ SPARK-1789. Multiple versions of Netty dependencies cause FlumeStreamSuite failure
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-10 20:50:40 -0700
+ Commit: c7253da, github.com/apache/spark/pull/723
+
+ Unify GraphImpl RDDs + other graph load optimizations
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-05-10 14:48:07 -0700
+ Commit: 4e9a0cb, github.com/apache/spark/pull/497
+
+ [SPARK-1690] Tolerating empty elements when saving Python RDD to text files
+ Kan Zhang <kzhang@apache.org>
+ 2014-05-10 14:01:08 -0700
+ Commit: ac86af8, github.com/apache/spark/pull/644
+
+ Add Python includes to path before depickling broadcast values
+ Bouke van der Bijl <boukevanderbijl@gmail.com>
+ 2014-05-10 13:02:13 -0700
+ Commit: 2a669a7, github.com/apache/spark/pull/656
+
+ fix broken link in python docs
+ Andy Konwinski <andykonwinski@gmail.com>
+ 2014-05-10 12:46:51 -0700
+ Commit: 71ad53f, github.com/apache/spark/pull/650
+
+ SPARK-1708. Add a ClassTag on Serializer and things that depend on it
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-10 12:10:24 -0700
+ Commit: 9fbb22c, github.com/apache/spark/pull/700
+
+ [SPARK-1778] [SQL] Add 'limit' transformation to SchemaRDD.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-10 12:03:27 -0700
+ Commit: 7486474, github.com/apache/spark/pull/711
+
+ [SQL] Upgrade parquet library.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-10 11:48:01 -0700
+ Commit: a61b71c, github.com/apache/spark/pull/684
+
+ [SPARK-1644] The org.datanucleus:* should not be packaged into spark-assembly-*.jar
+ witgo <witgo@qq.com>
+ 2014-05-10 10:15:04 -0700
+ Commit: 2a878da, github.com/apache/spark/pull/688
+
+ SPARK-1686: keep schedule() calling in the main thread
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-05-09 21:50:23 -0700
+ Commit: adf8cdd, github.com/apache/spark/pull/639
+
+ SPARK-1770: Revert accidental(?) fix
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-09 14:51:34 -0700
+ Commit: 8202276, github.com/apache/spark/pull/716
+
+ [SPARK-1760]: fix building spark with maven documentation
+ witgo <witgo@qq.com>
+ 2014-05-09 01:51:26 -0700
+ Commit: 80f292a, github.com/apache/spark/pull/712
+
+ Converted bang to ask to avoid scary warning when a block is removed
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-08 22:34:08 -0700
+ Commit: b8c17e3, github.com/apache/spark/pull/708
+
+ MINOR: Removing dead code.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-08 22:33:06 -0700
+ Commit: 1d56cd5
+
+ SPARK-1775: Unneeded lock in ShuffleMapTask.deserializeInfo
+ Sandeep <sandeep@techaddict.me>
+ 2014-05-08 22:30:17 -0700
+ Commit: 5c8e8de, github.com/apache/spark/pull/707
+
+ SPARK-1565 (Addendum): Replace `run-example` with `spark-submit`.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-08 22:26:17 -0700
+ Commit: f6323eb, github.com/apache/spark/pull/704
+
+ [SPARK-1631] Correctly set the Yarn app name when launching the AM.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-05-08 20:46:11 -0700
+ Commit: 7e19334, github.com/apache/spark/pull/539
+
+ [SPARK-1755] Respect SparkSubmit --name on YARN
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-08 20:45:29 -0700
+ Commit: 666bebe, github.com/apache/spark/pull/699
+
+ Include the sbin/spark-config.sh in spark-executor
+ Bouke van der Bijl <boukevanderbijl@gmail.com>
+ 2014-05-08 20:43:37 -0700
+ Commit: ab91227, github.com/apache/spark/pull/651
+
+ Bug fix of sparse vector conversion
+ Funes <tianshaocun@gmail.com>, funes <tianshaocun@gmail.com>
+ 2014-05-08 17:54:10 -0700
+ Commit: 9ed17ff, github.com/apache/spark/pull/661
+
+ [SPARK-1157][MLlib] Bug fix: lossHistory should exclude rejection steps, and remove miniBatch
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-05-08 17:53:22 -0700
+ Commit: 3452997, github.com/apache/spark/pull/582
+
+ MLlib documentation fix
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-05-08 17:52:32 -0700
+ Commit: d81d626, github.com/apache/spark/pull/703
+
+ Fixing typo in als.py
+ Evan Sparks <evan.sparks@gmail.com>
+ 2014-05-08 13:07:30 -0700
+ Commit: 98944a9, github.com/apache/spark/pull/696
+
+ [SPARK-1754] [SQL] Add missing arithmetic DSL operations.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-05-08 15:31:47 -0700
+ Commit: 6f701ff, github.com/apache/spark/pull/689
+
+ [SPARK-1745] Move interrupted flag from TaskContext constructor (minor)
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-08 12:13:07 -0700
+ Commit: ee63321, github.com/apache/spark/pull/675
+
+ SPARK-1565, update examples to be used with spark-submit script.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-05-08 10:23:05 -0700
+ Commit: 30cfa8d, github.com/apache/spark/pull/552
+
+ [SQL] Improve SparkSQL Aggregates
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-08 01:08:43 -0400
+ Commit: 8f3b925, github.com/apache/spark/pull/683
+
+ Use numpy directly for matrix multiply.
+ Evan Sparks <evan.sparks@gmail.com>
+ 2014-05-08 00:24:36 -0400
+ Commit: 010040f, github.com/apache/spark/pull/687
+
+ SPARK-1668: Add implicit preference as an option to examples/MovieLensALS
+ Sandeep <sandeep@techaddict.me>
+ 2014-05-08 00:15:05 -0400
+ Commit: 35aa244, github.com/apache/spark/pull/597
+
+ SPARK-1544 Add support for deep decision trees.
+ Manish Amde <manish9ue@gmail.com>, manishamde <manish9ue@gmail.com>, Evan Sparks <sparks@cs.berkeley.edu>
+ 2014-05-07 17:08:38 -0700
+ Commit: c7b2704, github.com/apache/spark/pull/475
+
+ Update GradientDescentSuite.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-05-07 16:02:55 -0700
+ Commit: 0972b62, github.com/apache/spark/pull/588
+
+ [SPARK-1743][MLLIB] add loadLibSVMFile and saveAsLibSVMFile to pyspark
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-07 16:01:11 -0700
+ Commit: bb90e87, github.com/apache/spark/pull/672
+
+ SPARK-1569 Spark on Yarn, authentication broken by pr299
+ Thomas Graves <tgraves@apache.org>
+ 2014-05-07 15:51:53 -0700
+ Commit: 879eeee, github.com/apache/spark/pull/649
+
+ [SPARK-1688] Propagate PySpark worker stderr to driver
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-07 14:35:22 -0700
+ Commit: 82c8e89, github.com/apache/spark/pull/603
+
+ Typo fix: fetchting -> fetching
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-07 17:24:49 -0400
+ Commit: 0759ee7, github.com/apache/spark/pull/680
+
+ Nicer logging for SecurityManager startup
+ Andrew Ash <andrew@andrewash.com>
+ 2014-05-07 17:24:12 -0400
+ Commit: 69e2726, github.com/apache/spark/pull/678
+
+ [SQL] Fix Performance Issue in data type casting
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-05-07 16:54:58 -0400
+ Commit: 82ceda2, github.com/apache/spark/pull/679
+
+ SPARK-1579: Clean up PythonRDD and avoid swallowing IOExceptions
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-07 09:48:31 -0700
+ Commit: 18caa8c, github.com/apache/spark/pull/640
+
+ [SPARK-1460] Returning SchemaRDD instead of normal RDD on Set operations...
+ Kan Zhang <kzhang@apache.org>
+ 2014-05-07 09:41:31 -0700
+ Commit: da9f9e0, github.com/apache/spark/pull/448
+
+ [WIP][Spark-SQL] Optimize the Constant Folding for Expression
+ Cheng Hao <hao.cheng@intel.com>, Michael Armbrust <michael@databricks.com>
+ 2014-05-07 03:37:12 -0400
+ Commit: 756c969, github.com/apache/spark/pull/482
+
+ SPARK-1746: Support setting SPARK_JAVA_OPTS on executors for backwards compatibility
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-07 00:11:05 -0700
+ Commit: 00fac73, github.com/apache/spark/pull/676
+
+ [HOTFIX] SPARK-1637: There are some Streaming examples added after the PR #571 was last updated.
+ Sandeep <sandeep@techaddict.me>
+ 2014-05-06 21:55:05 -0700
+ Commit: ade4756, github.com/apache/spark/pull/673
+
+ Proposal: clarify Scala programming guide on caching ...
+ Ethan Jewett <esjewett@gmail.com>
+ 2014-05-06 20:50:08 -0700
+ Commit: 51e2775, github.com/apache/spark/pull/668
+
+ SPARK-1727. Correct small compile errors, typos, and markdown issues in (primarily) MLlib docs
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-06 20:07:22 -0700
+ Commit: 514ee93, github.com/apache/spark/pull/653
+
+ SPARK-1637: Clean up examples for 1.0
+ Sandeep <sandeep@techaddict.me>
+ 2014-05-06 17:27:52 -0700
+ Commit: 8cfebf5, github.com/apache/spark/pull/571
+
+ SPARK-1737: Warn rather than fail when Java 7+ is used to create distributions
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-06 15:41:46 -0700
+ Commit: d8f1b33, github.com/apache/spark/pull/669
+
+ [SPARK-1549] Add Python support to spark-submit
+ Matei Zaharia <matei@databricks.com>
+ 2014-05-06 15:12:35 -0700
+ Commit: d7ddb26, github.com/apache/spark/pull/664
+
+ SPARK-1734: spark-submit throws an exception: Exception in thread "main"...
+ witgo <witgo@qq.com>
+ 2014-05-06 14:17:39 -0700
+ Commit: 48cc9a9, github.com/apache/spark/pull/665
+
+ [SPARK-1685] Cancel retryTimer on restart of Worker or AppClient
+ Mark Hamstra <markhamstra@gmail.com>
+ 2014-05-06 12:53:39 -0700
+ Commit: 0aaa2c6, github.com/apache/spark/pull/602
+
+ Fix two download suggestions in the docs:
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-06 12:07:46 -0700
+ Commit: 1083f2b, github.com/apache/spark/pull/662
+
+ SPARK-1474: Spark on yarn assembly doesn't include AmIpFilter
+ Thomas Graves <tgraves@apache.org>
+ 2014-05-06 12:00:09 -0700
+ Commit: 0c3e415, github.com/apache/spark/pull/406
+
+ Update OpenHashSet.scala
+ ArcherShao <ArcherShao@users.noreply.github.com>
+ 2014-05-06 10:12:59 -0700
+ Commit: 4ff3929, github.com/apache/spark/pull/667
+
+ [SQL] SPARK-1732 - Support for null primitive values.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-05 22:59:42 -0700
+ Commit: 39ac62d, github.com/apache/spark/pull/658
+
+ [SPARK-1735] Add the missing special profiles to make-distribution.sh
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-05 22:14:47 -0700
+ Commit: 4708eff, github.com/apache/spark/pull/660
+
+ [SPARK-1678][SPARK-1679] In-memory compression bug fix and made compression configurable, disabled by default
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-05-05 19:38:59 -0700
+ Commit: 2853e56, github.com/apache/spark/pull/608
+
+ [SPARK-1594][MLLIB] Cleaning up MLlib APIs and guide
+ Xiangrui Meng <meng@databricks.com>
+ 2014-05-05 18:32:54 -0700
+ Commit: 32c960a, github.com/apache/spark/pull/524
+
+ Expose SparkListeners and relevant classes as DeveloperApi
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-05 18:32:14 -0700
+ Commit: a5f765c, github.com/apache/spark/pull/648
+
+ SPARK-1728. JavaRDDLike.mapPartitionsWithIndex requires ClassTag
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-05-05 18:26:34 -0700
+ Commit: 01e3ff0, github.com/apache/spark/pull/657
+
+ [SPARK-1681] Include datanucleus jars in Spark Hive distribution
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-05 16:28:07 -0700
+ Commit: 4d0dd50, github.com/apache/spark/pull/610
+
+ [SPARK-1504], [SPARK-1505], [SPARK-1558] Updated Spark Streaming guide
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-05-05 15:28:19 -0700
+ Commit: 1fac4ec, github.com/apache/spark/pull/652
+
+ SPARK-1721: Reset the thread classLoader in the Mesos Executor
+ Bouke van der Bijl <boukevanderbijl@gmail.com>
+ 2014-05-05 11:19:35 -0700
+ Commit: 80f4360, github.com/apache/spark/pull/620
+
+ SPARK-1556. jets3t dep doesn't update properly with newer Hadoop versions
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-05 10:33:49 -0700
+ Commit: 5d72283, github.com/apache/spark/pull/629
+
+ Updated doc for spark.closure.serializer to indicate only Java serializer work.
+ Reynold Xin <rxin@apache.org>
+ 2014-05-05 00:52:06 -0700
+ Commit: 6be7226, github.com/apache/spark/pull/642
+
+ Address SPARK-1717
+ msiddalingaiah <madhu@madhu.com>
+ 2014-05-04 21:59:10 -0700
+ Commit: b5c62c8, github.com/apache/spark/pull/641
+
+ SPARK-1710: spark-submit should print better errors than "InvocationTargetException"
+ Sandeep <sandeep@techaddict.me>
+ 2014-05-04 20:51:53 -0700
+ Commit: afcb9ae, github.com/apache/spark/pull/630
+
+ EC2 script should exit with non-zero code on UsageError
+ Allan Douglas R. de Oliveira <allan@chaordicsystems.com>
+ 2014-05-04 20:36:51 -0700
+ Commit: 7305278, github.com/apache/spark/pull/638
+
+ SPARK-1693: Most of the tests throw a java.lang.SecurityException when s...
+ witgo <witgo@qq.com>
+ 2014-05-04 17:48:52 -0700
+ Commit: ec0bce1, github.com/apache/spark/pull/628
+
+ SPARK-1629. Addendum: Depend on commons lang3 (already used by tachyon) as it's used in ReplSuite, and return to use lang3 utility in Utils.scala
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-04 17:43:28 -0700
+ Commit: 4505bc2, github.com/apache/spark/pull/635
+
+ SPARK-1703 Warn users if Spark is run on JRE6 but compiled with JDK7.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-04 12:22:23 -0700
+ Commit: 2f091d5, github.com/apache/spark/pull/627
+
+ SPARK-1663. (Addendum) Fix signature of one version of JavaPairRDDStream.reduceByKeyAndWindow()
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-04 11:55:29 -0700
+ Commit: 40d05a4, github.com/apache/spark/pull/633
+
+ SPARK-1658: Correctly identify if maven is installed and working
+ Rahul Singhal <rahul.singhal@guavus.com>
+ 2014-05-04 11:08:39 -0700
+ Commit: 2ee5f04, github.com/apache/spark/pull/580
+
+ The default version of yarn is equal to the hadoop version
+ witgo <witgo@qq.com>
+ 2014-05-03 23:32:12 -0700
+ Commit: acbf307, github.com/apache/spark/pull/626
+
+ Whitelist Hive Tests
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-03 23:13:51 -0700
+ Commit: e88a636, github.com/apache/spark/pull/596
+
+ [SQL] Better logging when applying rules.
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-03 18:38:44 -0700
+ Commit: e24d5cd, github.com/apache/spark/pull/616
+
+ EC2 configurable workers
+ Allan Douglas R. de Oliveira <allan@chaordicsystems.com>
+ 2014-05-03 16:52:19 -0700
+ Commit: 8406ac4, github.com/apache/spark/pull/612
+
+ SPARK-1689 AppClient should indicate app is dead() when removed
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-03 13:27:10 -0700
+ Commit: 36e687d, github.com/apache/spark/pull/605
+
+ [Bugfix] Tachyon file cleanup logical error
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-05-03 13:23:52 -0700
+ Commit: bc3bfea, github.com/apache/spark/pull/575
+
+ SPARK-1663. Corrections for several compile errors in streaming code examples, and updates to follow API changes
+ Sean Owen <sowen@cloudera.com>
+ 2014-05-03 12:31:31 -0700
+ Commit: 08c4d11, github.com/apache/spark/pull/589
+
+ [WIP] SPARK-1676: Cache Hadoop UGIs by default to prevent FileSystem leak
+ Thomas Graves <tgraves@apache.org>
+ 2014-05-03 10:59:05 -0700
+ Commit: 0441515, github.com/apache/spark/pull/621
+
+ Update SchemaRDD.scala
+ ArcherShao <ArcherShao@users.noreply.github.com>
+ 2014-05-03 00:17:36 -0700
+ Commit: 34f22bc, github.com/apache/spark/pull/619
+
+ SPARK-1700: Close socket file descriptors on task completion
+ Aaron Davidson <aaron@databricks.com>
+ 2014-05-02 23:55:13 -0700
+ Commit: d2cbd3d, github.com/apache/spark/pull/623
+
+ SPARK-1492. Update Spark YARN docs to use spark-submit
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-05-02 21:42:31 -0700
+ Commit: a314342, github.com/apache/spark/pull/601
+
+ delete no use var
+ wangfei <wangfei_hello@126.com>
+ 2014-05-02 21:34:54 -0700
+ Commit: b65def7, github.com/apache/spark/pull/613
+
+ SPARK-1695: java8-tests compiler error: package com.google.common.co...
+ witgo <witgo@qq.com>
+ 2014-05-02 12:40:27 -0700
+ Commit: d28c058, github.com/apache/spark/pull/611
+
+ Add tests for FileLogger, EventLoggingListener, and ReplayListenerBus
+ Andrew Or <andrewor14@gmail.com>
+ 2014-05-01 21:42:06 -0700
+ Commit: d4c8af8, github.com/apache/spark/pull/591
+
+ SPARK-1659: improvements spark-submit usage
+ witgo <witgo@qq.com>
+ 2014-05-01 21:39:40 -0700
+ Commit: 18595dd, github.com/apache/spark/pull/581
+
+ fix the spelling mistake
+ wangfei <wangfei_hello@126.com>
+ 2014-05-01 21:37:22 -0700
+ Commit: 35ca6c5, github.com/apache/spark/pull/614
+
+ [SQL] SPARK-1661 - Fix regex_serde test
+ Michael Armbrust <michael@databricks.com>
+ 2014-05-01 21:32:43 -0700
+ Commit: d339b33, github.com/apache/spark/pull/595
+
+ SPARK-1691: Support quoted arguments inside of spark-submit.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-05-01 01:15:51 -0700
+ Commit: dd601bf, github.com/apache/spark/pull/609
+
+ Fix SPARK-1629: Spark should inline use of commons-lang `SystemUtils.IS_...
+ witgo <witgo@qq.com>
+ 2014-04-30 09:49:45 -0700
+ Commit: 74bb88b, github.com/apache/spark/pull/569
+
+ SPARK-1004. PySpark on YARN
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-04-29 23:24:34 -0700
+ Commit: 177361c, github.com/apache/spark/pull/30
+
+ Handle the vals that never used
+ WangTao <barneystinson@aliyun.com>
+ 2014-04-29 22:07:20 -0700
+ Commit: b0ded1f, github.com/apache/spark/pull/565
+
+ Args for worker rather than master
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-04-29 22:05:40 -0700
+ Commit: 775020f, github.com/apache/spark/pull/587
+
+ [SPARK-1646] Micro-optimisation of ALS
+ Tor Myklebust <tmyklebu@gmail.com>
+ 2014-04-29 22:04:34 -0700
+ Commit: 92269f9, github.com/apache/spark/pull/568
+
+ [SPARK-1674] fix interrupted system call error in pyspark's RDD.pipe
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-29 18:06:45 -0700
+ Commit: 919ed31, github.com/apache/spark/pull/594
+
+ SPARK-1588. Restore SPARK_YARN_USER_ENV and SPARK_JAVA_OPTS for YARN.
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-04-29 12:54:02 -0700
+ Commit: 5f48721, github.com/apache/spark/pull/586
+
+ SPARK-1509: add zipWithIndex zipWithUniqueId methods to java api
+ witgo <witgo@qq.com>
+ 2014-04-29 11:30:47 -0700
+ Commit: 9754d1b, github.com/apache/spark/pull/423
+
+ SPARK-1557 Set permissions on event log files/directories
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-29 09:19:48 -0500
+ Commit: bccd13e, github.com/apache/spark/pull/538
+
+ HOTFIX: minor change to release script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-29 00:59:38 -0700
+ Commit: c27ce2b
+
+ HOTFIX: minor change to release script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-29 00:53:32 -0700
+ Commit: 838cb0e
+
+ [SPARK-1636][MLLIB] Move main methods to examples
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-29 00:41:03 -0700
+ Commit: aa519e3, github.com/apache/spark/pull/584
+
+ Minor fix to python table caching API.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-29 00:36:15 -0700
+ Commit: 0995787, github.com/apache/spark/pull/585
+
+ HOTFIX: Bug in release script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-29 00:10:17 -0700
+ Commit: 4ed58aa
+
+ Manual revert of rc2 version changes.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-28 22:59:09 -0700
+ Commit: 2863344
+
+ Improved build configuration
+ witgo <witgo@qq.com>
+ 2014-04-28 22:50:51 -0700
+ Commit: ee96460, github.com/apache/spark/pull/480
+
+ SPARK-1652: Remove incorrect deprecation warning in spark-submit
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-28 18:14:59 -0700
+ Commit: 42ba706, github.com/apache/spark/pull/578
+
+ SPARK-1654 and SPARK-1653: Fixes in spark-submit.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-28 17:29:22 -0700
+ Commit: 2c9ce20, github.com/apache/spark/pull/576
+
+ SPARK-1652: Spark submit should fail gracefully if YARN not enabled
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-28 17:26:57 -0700
+ Commit: 38bf23e, github.com/apache/spark/pull/579
+
+ Changes to dev release script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-28 13:58:42 -0700
+ Commit: 32d9db3
+
+ [SPARK-1633][Streaming] Java API unit test and example for custom streaming receiver in Java
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-28 13:58:09 -0700
+ Commit: 6d89faf, github.com/apache/spark/pull/558
+
+ [SQL]Append some missing types for HiveUDF
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-04-27 23:59:42 -0700
+ Commit: 42cb3b4, github.com/apache/spark/pull/459
+
+ Update the import package name for TestHive in sbt shell
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-04-27 23:57:29 -0700
+ Commit: eb9308e, github.com/apache/spark/pull/574
+
+ Fix SPARK-1609: Executor fails to start when Command.extraJavaOptions contains multiple Java options
+ witgo <witgo@qq.com>
+ 2014-04-27 19:41:02 -0700
+ Commit: 7bbf313, github.com/apache/spark/pull/547
+
+ SPARK-1145: Memory mapping with many small blocks can cause JVM allocation failures
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-27 17:40:56 -0700
+ Commit: 2f24159, github.com/apache/spark/pull/43
+
+ HOTFIX: Minor patch to merge script.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-27 15:45:17 -0700
+ Commit: 99285d0
+
+ SPARK-1651: Delete existing deployment directory
+ Rahul Singhal <rahul.singhal@guavus.com>
+ 2014-04-27 15:50:48 -0700
+ Commit: 3c6c6c2, github.com/apache/spark/pull/573
+
+ SPARK-1648 Support closing JIRA's as part of merge script.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-27 15:41:57 -0700
+ Commit: da26f9b, github.com/apache/spark/pull/570
+
+ SPARK-1650: Correctly identify maven project version
+ Rahul Singhal <rahul.singhal@guavus.com>
+ 2014-04-27 15:17:06 -0700
+ Commit: 98b13e0, github.com/apache/spark/pull/572
+
+ SPARK-1606: Infer user application arguments instead of requiring --arg.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-26 19:24:29 -0700
+ Commit: ce57624, github.com/apache/spark/pull/563
+
+ SPARK-1467: Make StorageLevel.apply() factory methods Developer APIs
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-26 19:04:33 -0700
+ Commit: 18ecc63, github.com/apache/spark/pull/551
+
+ [SPARK-1608] [SQL] Fix Cast.nullable when cast from StringType to NumericType/TimestampType.
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-04-26 14:39:54 -0700
+ Commit: dcea67f, github.com/apache/spark/pull/532
+
+ add note of how to support table with more than 22 fields
+ wangfei <wangfei1@huawei.com>
+ 2014-04-26 14:38:42 -0700
+ Commit: a020686, github.com/apache/spark/pull/564
+
+ [Spark-1382] Fix NPE in DStream.slice (updated version of #365)
+ zsxwing <zsxwing@gmail.com>, Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-25 19:04:34 -0700
+ Commit: f85c681, github.com/apache/spark/pull/562
+
+ SPARK-1632. Remove unnecessary boxing in compares in ExternalAppendOnlyM...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-04-25 17:55:04 -0700
+ Commit: 94c71e0, github.com/apache/spark/pull/559
+
+ SPARK-1235: manage the DAGScheduler EventProcessActor with supervisor and refactor the DAGScheduler with Akka
+ CodingCat <zhunansjtu@gmail.com>, Xiangrui Meng <meng@databricks.com>, Nan Zhu <CodingCat@users.noreply.github.com>
+ 2014-04-25 16:04:48 -0700
+ Commit: 5673c1e, github.com/apache/spark/pull/186
+
+ SPARK-1607. HOTFIX: Fix syntax adapting Int result to Short
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-25 14:17:38 -0700
+ Commit: 784b2a6, github.com/apache/spark/pull/556
+
+ Update KafkaWordCount.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-04-25 13:18:49 -0700
+ Commit: a0912a8, github.com/apache/spark/pull/523
+
+ Delete the val that never used
+ WangTao <barneystinson@aliyun.com>
+ 2014-04-25 11:47:01 -0700
+ Commit: 97bfeda, github.com/apache/spark/pull/553
+
+ SPARK-1621 Upgrade Chill to 0.3.6
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-25 11:12:41 -0700
+ Commit: 2c8dfd4, github.com/apache/spark/pull/543
+
+ SPARK-1619 Launch spark-shell with spark-submit
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-24 23:59:16 -0700
+ Commit: 8ba7f40, github.com/apache/spark/pull/542
+
+ SPARK-1607. Replace octal literals, removed in Scala 2.11, with hex literals
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-24 23:34:00 -0700
+ Commit: 7493ca9, github.com/apache/spark/pull/529
+
+ Call correct stop().
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-24 23:22:03 -0700
+ Commit: 3eba9bd, github.com/apache/spark/pull/527
+
+ SPARK-1242 Add aggregate to python rdd
+ Holden Karau <holden@pigscanfly.ca>
+ 2014-04-24 23:07:54 -0700
+ Commit: f09a2c0, github.com/apache/spark/pull/139
+
+ Fix [SPARK-1078]: Remove the Unnecessary lift-json dependency
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-24 21:51:52 -0700
+ Commit: 496b9ae, github.com/apache/spark/pull/536
+
+ [Typo] In the maven docs: chd -> cdh
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-24 21:51:17 -0700
+ Commit: db69841, github.com/apache/spark/pull/548
+
+ Generalize pattern for planning hash joins.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-24 21:42:33 -0700
+ Commit: ab131ab, github.com/apache/spark/pull/418
+
+ [SPARK-1617] and [SPARK-1618] Improvements to streaming ui and bug fix to socket receiver
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-24 21:34:37 -0700
+ Commit: d933c71, github.com/apache/spark/pull/540
+
+ SPARK-1584: Upgrade Flume dependency to 1.4.0
+ tmalaska <ted.malaska@cloudera.com>
+ 2014-04-24 20:31:17 -0700
+ Commit: 777a9a5, github.com/apache/spark/pull/507
+
+ SPARK-1586 Windows build fixes
+ Mridul Muralidharan <mridulm80@apache.org>
+ 2014-04-24 20:48:33 -0700
+ Commit: 51a387a, github.com/apache/spark/pull/505
+
+ [SPARK-986]: Job cancelation for PySpark
+ Ahir Reddy <ahirreddy@gmail.com>
+ 2014-04-24 20:21:10 -0700
+ Commit: 7b6d774, github.com/apache/spark/pull/541
+
+ [SPARK-1615] Synchronize accesses to the LiveListenerBus' event queue
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-24 20:18:15 -0700
+ Commit: 963046c, github.com/apache/spark/pull/544
+
+ [SPARK-1510] Spark Streaming metrics source for metrics system
+ jerryshao <saisai.shao@intel.com>, Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-24 18:56:57 -0700
+ Commit: 0bc0f36, github.com/apache/spark/pull/545
+
+ Spark 1489 Fix the HistoryServer view acls
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-24 18:38:10 -0700
+ Commit: c8dd132, github.com/apache/spark/pull/509
+
+ [SQL] Add support for parsing indexing into arrays in SQL.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-24 18:21:00 -0700
+ Commit: 2a35fba, github.com/apache/spark/pull/518
+
+ [SPARK-1592][streaming] Automatically remove streaming input blocks
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-24 18:18:22 -0700
+ Commit: a3b6d85, github.com/apache/spark/pull/512
+
+ SPARK-1438 RDD.sample() make seed param optional
+ Arun Ramakrishnan <smartnut007@gmail.com>
+ 2014-04-24 17:27:16 -0700
+ Commit: 521d435, github.com/apache/spark/pull/477
+
+ SPARK-1104: kill Process in workerThread of ExecutorRunner
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-04-24 15:55:18 -0700
+ Commit: a1f8779, github.com/apache/spark/pull/35
+
+ Fix Scala Style
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-24 15:07:23 -0700
+ Commit: 2250c7a, github.com/apache/spark/pull/531
+
+ SPARK-1494 Don't initialize classes loaded by MIMA excludes, attempt 2
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-24 14:54:01 -0700
+ Commit: 5ca01f6, github.com/apache/spark/pull/526
+
+ Spark 1490 Add kerberos support to the HistoryServer
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-24 11:15:12 -0700
+ Commit: 866b03e, github.com/apache/spark/pull/513
+
+ SPARK-1611: Fix incorrect initialization order in AppendOnlyMap
+ zsxwing <zsxwing@gmail.com>
+ 2014-04-24 11:13:40 -0700
+ Commit: 00a3ccc, github.com/apache/spark/pull/534
+
+ SPARK-1488. Squash more language feature warnings in new commits by importing implicitConversion
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-24 10:06:18 -0700
+ Commit: 8d92d93, github.com/apache/spark/pull/528
+
+ Small changes to release script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-24 09:59:44 -0700
+ Commit: 563be2f
+
+ [SPARK-1610] [SQL] Fix Cast to use exact type value when cast from BooleanType to NumericTy...
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-04-24 09:57:28 -0700
+ Commit: 8f8e051, github.com/apache/spark/pull/533
+
+ SPARK-1601 & SPARK-1602: two bug fixes related to cancellation
+ Reynold Xin <rxin@apache.org>
+ 2014-04-24 00:27:45 -0700
+ Commit: f98aac9, github.com/apache/spark/pull/521
+
+ SPARK-1587 Fix thread leak
+ Mridul Muralidharan <mridulm80@apache.org>
+ 2014-04-23 23:20:55 -0700
+ Commit: 8684a15, github.com/apache/spark/pull/504
+
+ [Fix #79] Replace Breakable For Loops By While Loops
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-23 22:47:59 -0700
+ Commit: e890771, github.com/apache/spark/pull/503
+
+ SPARK-1589: Fix the incorrect compare
+ zsxwing <zsxwing@gmail.com>
+ 2014-04-23 22:36:02 -0700
+ Commit: 9716a72, github.com/apache/spark/pull/508
+
+ Mark all fields of EdgePartition, Graph, and GraphOps transient
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-04-23 22:01:13 -0700
+ Commit: bdd2691, github.com/apache/spark/pull/520
+
+ Update Java api for setJobGroup with interruptOnCancel
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-23 22:00:22 -0700
+ Commit: 36511ea, github.com/apache/spark/pull/522
+
+ [Hot Fix #469] Fix flaky test in SparkListenerSuite
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-23 21:59:33 -0700
+ Commit: 99c0c33, github.com/apache/spark/pull/516
+
+ [SPARK-1540] Add an optional Ordering parameter to PairRDDFunctions.
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-23 17:03:54 -0700
+ Commit: 31c7d83, github.com/apache/spark/pull/487
+
+ SPARK-1582 Invoke Thread.interrupt() when cancelling jobs
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-23 16:52:49 -0700
+ Commit: 55e6bea, github.com/apache/spark/pull/498
+
+ Honor default fs name when initializing event logger.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-04-23 14:47:38 -0700
+ Commit: 46b30f9, github.com/apache/spark/pull/450
+
+ SPARK-1572 Don't kill Executor if PythonRDD fails while computing parent
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-23 14:46:30 -0700
+ Commit: be8f26f, github.com/apache/spark/pull/486
+
+ SPARK-1583: Fix a bug that using java.util.HashMap by mistake
+ zsxwing <zsxwing@gmail.com>
+ 2014-04-23 14:12:20 -0700
+ Commit: 19ef78f, github.com/apache/spark/pull/500
+
+ SPARK-1119 and other build improvements
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-23 10:19:32 -0700
+ Commit: d36d75c, github.com/apache/spark/pull/502
+
+ [SQL] SPARK-1571 Mistake in java example code
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-22 22:19:32 -0700
+ Commit: b0d8793, github.com/apache/spark/pull/496
+
+ SPARK-1494 Don't initialize classes loaded by MIMA excludes.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-22 21:56:15 -0700
+ Commit: 18b1867, github.com/apache/spark/pull/494
+
+ SPARK-1562 Fix visibility / annotation of Spark SQL APIs
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-22 20:02:33 -0700
+ Commit: 0e03e6a, github.com/apache/spark/pull/489
+
+ [FIX: SPARK-1376] use --arg instead of --args in SparkSubmit to avoid warning messages
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-22 19:38:27 -0700
+ Commit: 61930bd, github.com/apache/spark/pull/485
+
+ [streaming][SPARK-1578] Removed requirement for TTL in StreamingContext.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-22 19:35:13 -0700
+ Commit: bf47559, github.com/apache/spark/pull/491
+
+ [Spark-1538] Fix SparkUI incorrectly hiding persisted RDDs
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-22 19:24:03 -0700
+ Commit: 104590c, github.com/apache/spark/pull/469
+
+ Assorted clean-up for Spark-on-YARN.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-22 19:22:06 -0700
+ Commit: f764f47, github.com/apache/spark/pull/488
+
+ [SPARK-1570] Fix classloading in JavaSQLContext.applySchema
+ Kan Zhang <kzhang@apache.org>
+ 2014-04-22 15:05:12 -0700
+ Commit: f9734e2, github.com/apache/spark/pull/484
+
+ Fix compilation on Hadoop 2.4.x.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-04-22 14:28:41 -0700
+ Commit: b6ba546, github.com/apache/spark/pull/483
+
+ [Fix #204] Eliminate delay between binding and log checking
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-22 14:27:49 -0700
+ Commit: 54c96c2, github.com/apache/spark/pull/441
+
+ [Fix #274] Document + fix annotation usages
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-21 22:24:44 -0700
+ Commit: 898fc34, github.com/apache/spark/pull/470
+
+ [HOTFIX] SPARK-1399: remove outdated comments
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-04-22 09:43:13 -0700
+ Commit: 61d7401, github.com/apache/spark/pull/474
+
+ [SPARK-1281] Improve partitioning in ALS
+ Tor Myklebust <tmyklebu@gmail.com>
+ 2014-04-22 11:07:30 -0700
+ Commit: 4834adf, github.com/apache/spark/pull/407
+
+ fix bugs of dot in python
+ Xusen Yin <yinxusen@gmail.com>
+ 2014-04-22 11:06:18 -0700
+ Commit: 4f2f093, github.com/apache/spark/pull/463
+
+ [SPARK-1506][MLLIB] Documentation improvements for MLlib 1.0
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-22 11:20:47 -0700
+ Commit: 3f708f5, github.com/apache/spark/pull/422
+
+ [SPARK-1560]: Updated Pyrolite Dependency to be Java 6 compatible
+ Ahir Reddy <ahirreddy@gmail.com>
+ 2014-04-22 09:44:41 -0700
+ Commit: 798d93f, github.com/apache/spark/pull/479
+
+ SPARK-1496: Have jarOfClass return Option[String]
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-22 00:42:16 -0700
+ Commit: 72aa131, github.com/apache/spark/pull/438
+
+ [SPARK-1459] Use local path (and not complete URL) when opening local lo...
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-04-21 23:10:53 -0700
+ Commit: 0a73103, github.com/apache/spark/pull/375
+
+ [SPARK-1439, SPARK-1440] Generate unified Scaladoc across projects and Javadocs
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-21 21:57:40 -0700
+ Commit: b0d70e4, github.com/apache/spark/pull/457
+
+ [SPARK-1332] Improve Spark Streaming's Network Receiver and InputDStream API [WIP]
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-21 19:04:49 -0700
+ Commit: 94cbe23, github.com/apache/spark/pull/300
+
+ Updating versions for Spark 1.0
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-21 16:59:38 -0700
+ Commit: a34e6fd
+
+ Dev script: include RC name in git tag
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-21 14:21:17 -0700
+ Commit: 1532af9
+
+ SPARK-1399: show stage failure reason in UI
+ CodingCat <zhunansjtu@gmail.com>, Nan Zhu <CodingCat@users.noreply.github.com>
+ 2014-04-21 14:10:23 -0700
+ Commit: 4b9220d, github.com/apache/spark/pull/421
+
+ SPARK-1539: RDDPage.scala contains RddPage class
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-21 12:48:02 -0700
+ Commit: 8aa3860, github.com/apache/spark/pull/454
+
+ [Hot Fix] Ignore org.apache.spark.ui.UISuite tests
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-21 12:37:43 -0700
+ Commit: d62ce6d, github.com/apache/spark/pull/466
+
+ REPL cleanup.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-19 17:32:24 -0700
+ Commit: 8e1e7ec, github.com/apache/spark/pull/451
+
+ Clean up and simplify Spark configuration
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-21 10:26:33 -0700
+ Commit: 29ee101, github.com/apache/spark/pull/299
+
+ [SPARK-1535] ALS: Avoid the garbage-creating ctor of DoubleMatrix
+ Tor Myklebust <tmyklebu@gmail.com>
+ 2014-04-19 15:10:18 -0700
+ Commit: 9ce6ed4, github.com/apache/spark/pull/442
+
+ Add insertInto and saveAsTable to Python API.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-19 15:08:54 -0700
+ Commit: 6ab0719, github.com/apache/spark/pull/447
+
+ Use scala deprecation instead of java.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-19 15:06:04 -0700
+ Commit: bfb09c6, github.com/apache/spark/pull/452
+
+ README update
+ Reynold Xin <rxin@apache.org>
+ 2014-04-18 22:34:39 -0700
+ Commit: 2fe6b18, github.com/apache/spark/pull/443
+
+ SPARK-1482: Fix potential resource leaks in saveAsHadoopDataset and save...
+ zsxwing <zsxwing@gmail.com>
+ 2014-04-18 17:49:22 -0700
+ Commit: ea17460, github.com/apache/spark/pull/400
+
+ SPARK-1456 Remove view bounds on Ordered in favor of a context bound on Ordering.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-18 12:04:13 -0700
+ Commit: 9e21b97, github.com/apache/spark/pull/410
+
+ Fixed broken pyspark shell.
+ Reynold Xin <rxin@apache.org>
+ 2014-04-18 10:10:13 -0700
+ Commit: d8767c4, github.com/apache/spark/pull/444
+
+ SPARK-1523: improve the readability of code in AkkaUtil
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-04-18 10:05:00 -0700
+ Commit: 171cea8, github.com/apache/spark/pull/434
+
+ SPARK-1357 (addendum). More Experimental items in MLlib
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-18 10:04:02 -0700
+ Commit: 1a30429, github.com/apache/spark/pull/372
+
+ [SPARK-1520] remove fastutil from dependencies
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-18 10:03:15 -0700
+ Commit: c40eec8, github.com/apache/spark/pull/437
+
+ Reuses Row object in ExistingRdd.productToRowRdd()
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-04-18 10:02:27 -0700
+ Commit: 977467e, github.com/apache/spark/pull/432
+
+ SPARK-1483: Rename minSplits to minPartitions in public APIs
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-04-18 10:01:16 -0700
+ Commit: 969a075, github.com/apache/spark/pull/430
+
+ HOTFIX: Ignore streaming UI test
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-17 17:33:24 -0700
+ Commit: 1c0dc37, github.com/apache/spark/pull/440
+
+ FIX: Don't build Hive in assembly unless running Hive tests.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-17 17:24:00 -0700
+ Commit: 3225272, github.com/apache/spark/pull/439
+
+ Add clean to build
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-16 16:32:34 -0700
+ Commit: 67d01d8
+
+ HOTFIX: Use file name and not paths for excludes
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-14 15:51:54 -0700
+ Commit: 5349fab
+
+ SPARK-1408 Modify Spark on Yarn to point to the history server when app ...
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-17 16:36:37 -0500
+ Commit: 6195fb8, github.com/apache/spark/pull/362
+
+ [SPARK-1395] Allow "local:" URIs to work on Yarn.
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-04-17 10:29:38 -0500
+ Commit: a83a794, github.com/apache/spark/pull/303
+
+ [python alternative] pyspark require Python2, failing if system default is Py3 from shell.py
+ AbhishekKr <abhikumar163@gmail.com>
+ 2014-04-16 19:05:40 -0700
+ Commit: b3ad707, github.com/apache/spark/pull/399
+
+ SPARK-1462: Examples of ML algorithms are using deprecated APIs
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-16 18:23:07 -0700
+ Commit: 13fb4c7, github.com/apache/spark/pull/416
+
+ Include stack trace for exceptions thrown by user code.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-16 18:12:56 -0700
+ Commit: aef8a4a, github.com/apache/spark/pull/409
+
+ Update ReducedWindowedDStream.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-04-16 18:08:11 -0700
+ Commit: 822353d, github.com/apache/spark/pull/425
+
+ misleading task number of groupByKey
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-04-16 17:58:42 -0700
+ Commit: 51c41da, github.com/apache/spark/pull/403
+
+ Fixing a race condition in event listener unit test
+ Kan Zhang <kzhang@apache.org>
+ 2014-04-16 17:39:11 -0700
+ Commit: f0abf5f, github.com/apache/spark/pull/401
+
+ remove unnecessary brace and semicolon in 'putBlockInfo.synchronize' block
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-04-16 17:30:01 -0700
+ Commit: e43e31d, github.com/apache/spark/pull/411
+
+ SPARK-1329: Create pid2vid with correct number of partitions
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-04-16 17:16:55 -0700
+ Commit: b4ea3d9, github.com/apache/spark/pull/368
+
+ Rebuild routing table after Graph.reverse
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-04-16 17:15:50 -0700
+ Commit: 602b9ea, github.com/apache/spark/pull/431
+
+ [SPARK-1511] use Files.move instead of renameTo in TestUtils.scala
+ Ye Xianjin <advancedxy@gmail.com>
+ 2014-04-16 14:56:22 -0700
+ Commit: 87a7c4f, github.com/apache/spark/pull/427
+
+ SPARK-1465: Spark compilation is broken with the latest hadoop-2.4.0 release
+ xuan <xuan@MacBook-Pro.local>, xuan <xuan@macbook-pro.home>
+ 2014-04-16 14:41:22 -0500
+ Commit: d8fc4a4, github.com/apache/spark/pull/396
+
+ SPARK-1469: Scheduler mode should accept lower-case definitions and have...
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-16 09:58:57 -0700
+ Commit: b75301f, github.com/apache/spark/pull/388
+
+ Minor addition to SPARK-1497
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-16 09:43:17 -0700
+ Commit: 4479ecd
+
+ SPARK-1497. Fix scalastyle warnings in YARN, Hive code
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-16 09:34:59 -0700
+ Commit: c744d66, github.com/apache/spark/pull/413
+
+ SPARK-1310: Start adding k-fold cross validation to MLLib [adds kFold to MLUtils & fixes bug in BernoulliSampler]
+ Holden Karau <holden@pigscanfly.ca>
+ 2014-04-16 09:33:27 -0700
+ Commit: 8efec04, github.com/apache/spark/pull/18
+
+ update spark.default.parallelism
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-04-16 09:14:18 -0700
+ Commit: e4f5577, github.com/apache/spark/pull/389
+
+ Loads test tables when running "sbt hive/console" without HIVE_DEV_HOME
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-04-16 08:54:34 -0700
+ Commit: 9e908ab, github.com/apache/spark/pull/417
+
+ Make "spark logo" link refer to "/".
+ Marcelo Vanzin <vanzin@cloudera.com>
+ 2014-04-16 08:53:01 -0700
+ Commit: 5fe18a7, github.com/apache/spark/pull/408
+
+ [SPARK-959] Updated SBT from 0.13.1 to 0.13.2
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-04-16 08:52:14 -0700
+ Commit: 1ea9a21, github.com/apache/spark/pull/426
+
+ [SQL] SPARK-1424 Generalize insertIntoTable functions on SchemaRDDs
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-15 20:40:40 -0700
+ Commit: e5130d9, github.com/apache/spark/pull/354
+
+ [WIP] SPARK-1430: Support sparse data in Python MLlib
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-15 20:33:24 -0700
+ Commit: 95647fa, github.com/apache/spark/pull/341
+
+ [FIX] update sbt-idea to version 1.6.0
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-15 19:37:32 -0700
+ Commit: 33d6e37, github.com/apache/spark/pull/419
+
+ SPARK-1455: Better isolation for unit tests.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-15 19:34:39 -0700
+ Commit: 110e825, github.com/apache/spark/pull/420
+
+ Decision Tree documentation for MLlib programming guide
+ Manish Amde <manish9ue@gmail.com>
+ 2014-04-15 11:14:28 -0700
+ Commit: 194ed06, github.com/apache/spark/pull/402
+
+ [SPARK-1157][MLlib] L-BFGS Optimizer based on Breeze's implementation.
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-04-15 11:12:47 -0700
+ Commit: 5812472, github.com/apache/spark/pull/353
+
+ SPARK-1501: Ensure assertions in Graph.apply are asserted.
+ William Benton <willb@redhat.com>
+ 2014-04-15 10:38:42 -0700
+ Commit: 692dd69, github.com/apache/spark/pull/415
+
+ SPARK-1426: Make MLlib work with NumPy versions older than 1.7
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-15 00:19:43 -0700
+ Commit: 1491b2a, github.com/apache/spark/pull/391
+
+ SPARK-1374: PySpark API for SparkSQL
+ Ahir Reddy <ahirreddy@gmail.com>, Michael Armbrust <michael@databricks.com>
+ 2014-04-15 00:07:55 -0700
+ Commit: 7433f64, github.com/apache/spark/pull/363
+
+ SPARK-1488. Resolve scalac feature warnings during build
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-14 19:50:00 -0700
+ Commit: 7471828, github.com/apache/spark/pull/404
+
+ [BUGFIX] In-memory columnar storage bug fixes
+ Cheng Lian <lian.cs.zju@gmail.com>, Michael Armbrust <michael@databricks.com>
+ 2014-04-14 15:22:43 -0700
+ Commit: fdebb69, github.com/apache/spark/pull/374
+
+ [SPARK-1415] Hadoop min split for wholeTextFiles()
+ Xusen Yin <yinxusen@gmail.com>
+ 2014-04-13 13:18:52 -0700
+ Commit: 1cf565f, github.com/apache/spark/pull/376
+
+ SPARK-1480: Clean up use of classloaders
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-13 08:58:37 -0700
+ Commit: 3537e25, github.com/apache/spark/pull/398
+
+ [SPARK-1403] Move the class loader creation back to where it was in 0.9.0
+ Bharath Bhushan <manku.timma@outlook.com>
+ 2014-04-12 20:52:29 -0700
+ Commit: c970d86, github.com/apache/spark/pull/322
+
+ [Fix #204] Update out-dated comments
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-12 16:33:38 -0700
+ Commit: 52d401b, github.com/apache/spark/pull/381
+
+ [SPARK-1386] Web UI for Spark Streaming
+ Tathagata Das <tathagata.das1565@gmail.com>, Andrew Or <andrewor14@gmail.com>
+ 2014-04-11 23:33:49 -0700
+ Commit: f36dc3f, github.com/apache/spark/pull/290
+
+ SPARK-1057 (alternative) Remove fastutil
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-11 22:46:47 -0700
+ Commit: 4dfcb38, github.com/apache/spark/pull/266
+
+ Update WindowedDStream.scala
+ baishuo(白硕) <vc_java@hotmail.com>
+ 2014-04-11 20:33:42 -0700
+ Commit: dac6240, github.com/apache/spark/pull/390
+
+ [WIP] [SPARK-1328] Add vector statistics
+ Xusen Yin <yinxusen@gmail.com>, Xiangrui Meng <meng@databricks.com>
+ 2014-04-11 19:43:22 -0700
+ Commit: ce0ce3d, github.com/apache/spark/pull/268
+
+ [FIX] make coalesce test deterministic in RDDSuite
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-11 19:41:40 -0700
+ Commit: 9afaeed, github.com/apache/spark/pull/387
+
+ HOTFIX: Ignore python metastore files in RAT checks.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-11 13:23:21 -0700
+ Commit: 79eb276, github.com/apache/spark/pull/393
+
+ [SPARK-1225, 1241] [MLLIB] Add AreaUnderCurve and BinaryClassificationMetrics
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-11 12:06:13 -0700
+ Commit: e6128b5, github.com/apache/spark/pull/364
+
+ Some clean up in build/docs
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-11 10:45:27 -0700
+ Commit: 170b09d, github.com/apache/spark/pull/382
+
+ SPARK-1417: Spark on Yarn - spark UI link from resourcemanager is broken
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-11 13:17:48 +0530
+ Commit: 9e90c46, github.com/apache/spark/pull/344
+
+ SPARK-1202: Improvements to task killing in the UI.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-10 20:43:56 -0700
+ Commit: a1bb4c6, github.com/apache/spark/pull/386
+
+ Add Spark v0.9.1 to ec2 launch script and use it as the default
+ Harvey Feng <hyfeng224@gmail.com>
+ 2014-04-10 18:25:54 -0700
+ Commit: 59de39b, github.com/apache/spark/pull/385
+
+ Set spark.executor.uri from environment variable (needed by Mesos)
+ Ivan Wick <ivanwick+github@gmail.com>
+ 2014-04-10 17:49:30 -0700
+ Commit: 41df293, github.com/apache/spark/pull/311
+
+ SPARK-1202 - Add a "cancel" button in the UI for stages
+ Sundeep Narravula <sundeepn@superduel.local>, Sundeep Narravula <sundeepn@dhcpx-204-110.corp.yahoo.com>
+ 2014-04-10 17:10:11 -0700
+ Commit: 211f974, github.com/apache/spark/pull/246
+
+ [SQL] Improve column pruning in the optimizer.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-10 16:20:33 -0700
+ Commit: 4843ef0, github.com/apache/spark/pull/378
+
+ Remove Unnecessary Whitespace's
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-10 15:04:13 -0700
+ Commit: 09bf14b, github.com/apache/spark/pull/380
+
+ Update tuning.md
+ Andrew Ash <andrew@andrewash.com>
+ 2014-04-10 14:59:58 -0700
+ Commit: 4c9906d, github.com/apache/spark/pull/384
+
+ Revert "SPARK-1433: Upgrade Mesos dependency to 0.17.0"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-10 14:43:29 -0700
+ Commit: 1e2cdbc
+
+ SPARK-1428: MLlib should convert non-float64 NumPy arrays to float64 instead of complaining
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-10 11:17:41 -0700
+ Commit: 2ac43ad, github.com/apache/spark/pull/356
+
+ [SPARK-1276] Add a HistoryServer to render persisted UI
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-10 10:39:34 -0700
+ Commit: 9ae80bf, github.com/apache/spark/pull/204
+
+ Fix SPARK-1413: Parquet messes up stdout and stdin when used in Spark REPL
+ witgo <witgo@qq.com>
+ 2014-04-10 10:35:24 -0700
+ Commit: a74fbbb, github.com/apache/spark/pull/325
+
+ Revert "SPARK-729: Closures not always serialized at capture time"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-10 02:10:40 -0700
+ Commit: e6d4a74
+
+ SPARK-1446: Spark examples should not do a System.exit
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-10 00:37:21 -0700
+ Commit: e55cc4b, github.com/apache/spark/pull/370
+
+ SPARK-729: Closures not always serialized at capture time
+ William Benton <willb@redhat.com>
+ 2014-04-09 18:56:27 -0700
+ Commit: 8ca3b2b, github.com/apache/spark/pull/189
+
+ [SPARK-1357 (fix)] remove empty line after :: DeveloperApi/Experimental ::
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-09 17:08:17 -0700
+ Commit: 0adc932, github.com/apache/spark/pull/373
+
+ SPARK-1407 drain event queue before stopping event logger
+ Kan Zhang <kzhang@apache.org>
+ 2014-04-09 15:24:33 -0700
+ Commit: eb5f2b6, github.com/apache/spark/pull/366
+
+ [SPARK-1357] [MLLIB] Annotate developer and experimental APIs
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-09 02:21:15 -0700
+ Commit: bde9cc1, github.com/apache/spark/pull/298
+
+ SPARK-1093: Annotate developer and experimental API's
+ Patrick Wendell <pwendell@gmail.com>, Andrew Or <andrewor14@gmail.com>
+ 2014-04-09 01:14:46 -0700
+ Commit: 87bd1f9, github.com/apache/spark/pull/274
+
+ [SPARK-1390] Refactoring of matrices backed by RDDs
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-08 23:01:15 -0700
+ Commit: 9689b66, github.com/apache/spark/pull/296
+
+ Spark-939: allow user jars to take precedence over spark jars
+ Holden Karau <holden@pigscanfly.ca>
+ 2014-04-08 22:29:21 -0700
+ Commit: fa0524f, github.com/apache/spark/pull/217
+
+ [SPARK-1434] [MLLIB] change labelParser from anonymous function to trait
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-08 20:37:01 -0700
+ Commit: b9e0c93, github.com/apache/spark/pull/345
+
+ Spark 1271: Co-Group and Group-By should pass Iterable[X]
+ Holden Karau <holden@pigscanfly.ca>
+ 2014-04-08 18:15:52 -0700
+ Commit: ce8ec54, github.com/apache/spark/pull/242
+
+ SPARK-1433: Upgrade Mesos dependency to 0.17.0
+ Sandeep <sandeep@techaddict.me>
+ 2014-04-08 16:19:22 -0700
+ Commit: 12c077d, github.com/apache/spark/pull/355
+
+ [SPARK-1397] Notify SparkListeners when stages fail or are cancelled.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-04-08 14:42:02 -0700
+ Commit: fac6085, github.com/apache/spark/pull/309
+
+ SPARK-1445: compute-classpath should not print error if lib_managed not found
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-08 14:40:20 -0700
+ Commit: e25b593, github.com/apache/spark/pull/361
+
+ SPARK-1348 binding Master, Worker, and App Web UI to all interfaces
+ Kan Zhang <kzhang@apache.org>
+ 2014-04-08 14:30:24 -0700
+ Commit: a8d86b0, github.com/apache/spark/pull/318
+
+ Remove extra semicolon in import statement and unused import in ApplicationMaster
+ Henry Saputra <hsaputra@apache.org>
+ 2014-04-08 14:23:16 -0700
+ Commit: 3bc0548, github.com/apache/spark/pull/358
+
+ [SPARK-1396] Properly cleanup DAGScheduler on job cancellation.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-04-08 01:03:33 -0700
+ Commit: 6dc5f58, github.com/apache/spark/pull/305
+
+ [SPARK-1331] Added graceful shutdown to Spark Streaming
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-04-08 00:00:17 -0700
+ Commit: 83ac9a4, github.com/apache/spark/pull/247
+
+ [SPARK-1103] Automatic garbage collection of RDD, shuffle and broadcast data
+ Tathagata Das <tathagata.das1565@gmail.com>, Andrew Or <andrewor14@gmail.com>, Roman Pastukhov <ignatich@mail.ru>
+ 2014-04-07 23:40:21 -0700
+ Commit: 11eabbe, github.com/apache/spark/pull/126
+
+ [SPARK-1402] Added 3 more compression schemes
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-04-07 22:24:12 -0700
+ Commit: 0d0493f, github.com/apache/spark/pull/330
+
+ Change timestamp cast semantics. When cast to numeric types, return the unix time in seconds (instead of millis).
+ Reynold Xin <rxin@apache.org>
+ 2014-04-07 19:28:24 -0700
+ Commit: f27e56a, github.com/apache/spark/pull/352
+
+ Added eval for Rand (without any support for user-defined seed).
+ Reynold Xin <rxin@apache.org>
+ 2014-04-07 18:40:08 -0700
+ Commit: 31e6fff, github.com/apache/spark/pull/349
+
+ Removed the default eval implementation from Expression, and added a bunch of override's in classes I touched.
+ Reynold Xin <rxin@apache.org>
+ 2014-04-07 18:39:18 -0700
+ Commit: 55dfd5d, github.com/apache/spark/pull/350
+
+ [sql] Rename execution/aggregates.scala Aggregate.scala, and added a bunch of private[this] to variables.
+ Reynold Xin <rxin@apache.org>
+ 2014-04-07 18:38:44 -0700
+ Commit: 14c9238, github.com/apache/spark/pull/348
+
+ SPARK-1099: Introduce local[*] mode to infer number of cores
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-07 13:06:30 -0700
+ Commit: 0307db0, github.com/apache/spark/pull/182
+
+ HOTFIX: Disable actor input stream test.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-07 12:47:27 -0700
+ Commit: 2a2ca48, github.com/apache/spark/pull/347
+
+ SPARK-1252. On YARN, use container-log4j.properties for executors
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-04-07 13:28:14 -0500
+ Commit: 9dd8b91, github.com/apache/spark/pull/148
+
+ [sql] Rename Expression.apply to eval for better readability.
+ Reynold Xin <rxin@apache.org>
+ 2014-04-07 10:45:31 -0700
+ Commit: 83f2a2f, github.com/apache/spark/pull/340
+
+ SPARK-1432: Make sure that all metadata fields are properly cleaned
+ Davis Shepherd <davis@conviva.com>
+ 2014-04-07 10:02:00 -0700
+ Commit: a3c51c6, github.com/apache/spark/pull/338
+
+ [SQL] SPARK-1427 Fix toString for SchemaRDD NativeCommands.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-07 01:46:50 -0700
+ Commit: b5bae84, github.com/apache/spark/pull/343
+
+ [SQL] SPARK-1371 Hash Aggregation Improvements
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-07 00:14:00 -0700
+ Commit: accd099, github.com/apache/spark/pull/295
+
+ SPARK-1431: Allow merging conflicting pull requests
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-06 21:04:45 -0700
+ Commit: 87d0928, github.com/apache/spark/pull/342
+
+ SPARK-1154: Clean up app folders in worker nodes
+ Evan Chan <ev@ooyala.com>, Kelvin Chu <kelvinkwchu@yahoo.com>
+ 2014-04-06 19:17:33 -0700
+ Commit: 1440154, github.com/apache/spark/pull/288
+
+ SPARK-1314: Use SPARK_HIVE to determine if we include Hive in packaging
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-06 17:48:41 -0700
+ Commit: 4106558, github.com/apache/spark/pull/237
+
+ SPARK-1349: spark-shell gets its own command history
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-06 17:43:44 -0700
+ Commit: 7ce52c4, github.com/apache/spark/pull/267
+
+ SPARK-1387. Update build plugins, avoid plugin version warning, centralize versions
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-06 17:40:37 -0700
+ Commit: 856c50f, github.com/apache/spark/pull/291
+
+ [SPARK-1259] Make RDD locally iterable
+ Egor Pakhomov <pahomov.egor@gmail.com>
+ 2014-04-06 16:41:23 -0700
+ Commit: e258e50, github.com/apache/spark/pull/156
+
+ Fix SPARK-1420 The maven build error for Spark Catalyst
+ witgo <witgo@qq.com>
+ 2014-04-06 16:03:06 -0700
+ Commit: 7012ffa, github.com/apache/spark/pull/333
+
+ SPARK-1421. Make MLlib work on Python 2.6
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-05 20:52:05 -0700
+ Commit: 0b85516, github.com/apache/spark/pull/335
+
+ Fix for PR #195 for Java 6
+ Sean Owen <sowen@cloudera.com>
+ 2014-04-05 19:08:24 -0700
+ Commit: 890d63b, github.com/apache/spark/pull/334
+
+ [SPARK-1371] fix computePreferredLocations signature to not depend on underlying implementation
+ Mridul Muralidharan <mridulm80@apache.org>
+ 2014-04-05 15:23:37 -0700
+ Commit: 6e88583, github.com/apache/spark/pull/302
+
+ Remove the getStageInfo() method from SparkContext.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-04-05 15:17:50 -0700
+ Commit: 2d0150c, github.com/apache/spark/pull/308
+
+ HOTFIX for broken CI, by SPARK-1336
+ Prashant Sharma <prashant.s@imaginea.com>, Prashant Sharma <scrapcodes@gmail.com>
+ 2014-04-04 22:49:19 -0700
+ Commit: 7c18428, github.com/apache/spark/pull/321
+
+ small fix ( proogram -> program )
+ Prabeesh K <prabsmails@gmail.com>
+ 2014-04-04 21:32:00 -0700
+ Commit: 0acc7a0, github.com/apache/spark/pull/331
+
+ [SQL] SPARK-1366 Consistent sql function across different types of SQLContexts
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-04 21:15:33 -0700
+ Commit: 8de038e, github.com/apache/spark/pull/319
+
+ SPARK-1305: Support persisting RDD's directly to Tachyon
+ Haoyuan Li <haoyuan@cs.berkeley.edu>, RongGu <gurongwalker@gmail.com>
+ 2014-04-04 20:36:24 -0700
+ Commit: b50ddfd, github.com/apache/spark/pull/158
+
+ [SPARK-1419] Bumped parent POM to apache 14
+ Mark Hamstra <markhamstra@gmail.com>
+ 2014-04-04 19:19:48 -0700
+ Commit: 1347ebd, github.com/apache/spark/pull/328
+
+ Add test utility for generating Jar files with compiled classes.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-04 19:15:15 -0700
+ Commit: 5f3c1bb, github.com/apache/spark/pull/326
+
+ SPARK-1414. Python API for SparkContext.wholeTextFiles
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-04 17:29:29 -0700
+ Commit: 60e18ce, github.com/apache/spark/pull/327
+
+ [SQL] Minor fixes.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-04 17:23:17 -0700
+ Commit: d956cc2, github.com/apache/spark/pull/315
+
+ [SPARK-1198] Allow pipes tasks to run in different sub-directories
+ Thomas Graves <tgraves@apache.org>
+ 2014-04-04 17:16:31 -0700
+ Commit: 198892f, github.com/apache/spark/pull/128
+
+ Don't create SparkContext in JobProgressListenerSuite.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-04 14:46:32 -0700
+ Commit: a02b535, github.com/apache/spark/pull/324
+
+ SPARK-1375. Additional spark-submit cleanup
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-04-04 13:28:42 -0700
+ Commit: 16b8308, github.com/apache/spark/pull/278
+
+ [SPARK-1133] Add whole text files reader in MLlib
+ Xusen Yin <yinxusen@gmail.com>
+ 2014-04-04 11:12:47 -0700
+ Commit: f1fa617, github.com/apache/spark/pull/252
+
+ SPARK-1404: Always upgrade spark-env.sh vars to environment vars
+ Aaron Davidson <aaron@databricks.com>
+ 2014-04-04 09:50:24 -0700
+ Commit: 01cf4c4, github.com/apache/spark/pull/310
+
+ SPARK-1350. Always use JAVA_HOME to run executor container JVMs.
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-04-04 08:54:04 -0500
+ Commit: 7f32fd4, github.com/apache/spark/pull/313
+
+ SPARK-1337: Application web UI garbage collects newest stages
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-03 22:13:56 -0700
+ Commit: ee6e9e7, github.com/apache/spark/pull/320
+
+ Revert "[SPARK-1398] Removed findbugs jsr305 dependency"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-04-03 17:00:06 -0700
+ Commit: 33e6361
+
+ Fix jenkins from giving the green light to builds that don't compile.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-03 16:53:35 -0700
+ Commit: 9231b01, github.com/apache/spark/pull/317
+
+ [BUILD FIX] Fix compilation of Spark SQL Java API.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-03 16:12:08 -0700
+ Commit: d94826b, github.com/apache/spark/pull/316
+
+ [SPARK-1134] Fix and document passing of arguments to IPython
+ Diana Carroll <dcarroll@cloudera.com>
+ 2014-04-03 15:48:42 -0700
+ Commit: a599e43, github.com/apache/spark/pull/294
+
+ [SQL] SPARK-1333 First draft of java API
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-03 15:45:34 -0700
+ Commit: b8f5341, github.com/apache/spark/pull/248
+
+ Spark 1162 Implemented takeOrdered in pyspark.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-04-03 15:42:17 -0700
+ Commit: c1ea3af, github.com/apache/spark/pull/97
+
+ [SPARK-1360] Add Timestamp Support for SQL
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-04-03 15:33:17 -0700
+ Commit: 5d1feda, github.com/apache/spark/pull/275
+
+ Spark parquet improvements
+ Andre Schumacher <andre.schumacher@iki.fi>
+ 2014-04-03 15:31:47 -0700
+ Commit: fbebaed, github.com/apache/spark/pull/195
+
+ [SPARK-1398] Removed findbugs jsr305 dependency
+ Mark Hamstra <markhamstra@gmail.com>
+ 2014-04-03 14:08:47 -0700
+ Commit: 92a86b2, github.com/apache/spark/pull/307
+
+ [SQL] SPARK-1364 Improve datatype and test coverage for ScalaReflection schema inference.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-02 18:14:31 -0700
+ Commit: 47ebea5, github.com/apache/spark/pull/293
+
+ [SPARK-1212, Part II] Support sparse data in MLlib
+ Xiangrui Meng <meng@databricks.com>
+ 2014-04-02 14:01:12 -0700
+ Commit: 9c65fa7, github.com/apache/spark/pull/245
+
+ StopAfter / TopK related changes
+ Reynold Xin <rxin@apache.org>, Michael Armbrust <michael@databricks.com>
+ 2014-04-02 12:48:04 -0700
+ Commit: ed730c9, github.com/apache/spark/pull/233
+
+ [SPARK-1371][WIP] Compression support for Spark SQL in-memory columnar storage
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-04-02 12:47:22 -0700
+ Commit: 1faa579, github.com/apache/spark/pull/285
+
+ Do not re-use objects in the EdgePartition/EdgeTriplet iterators.
+ Daniel Darabos <darabos.daniel@gmail.com>
+ 2014-04-02 12:27:37 -0700
+ Commit: 7823633, github.com/apache/spark/pull/276
+
+ [SPARK-1385] Use existing code for JSON de/serialization of BlockId
+ Andrew Or <andrewor14@gmail.com>
+ 2014-04-02 10:43:09 -0700
+ Commit: de8eefa, github.com/apache/spark/pull/289
+
+ Renamed stageIdToActiveJob to jobIdToActiveJob.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-04-02 10:35:52 -0700
+ Commit: 11973a7, github.com/apache/spark/pull/301
+
+ Remove * from test case golden filename.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-01 23:54:38 -0700
+ Commit: ea9de65, github.com/apache/spark/pull/297
+
+ MLI-1 Decision Trees
+ Manish Amde <manish9ue@gmail.com>, manishamde <manish9ue@gmail.com>, Xiangrui Meng <meng@databricks.com>
+ 2014-04-01 21:40:49 -0700
+ Commit: 8b3045c, github.com/apache/spark/pull/79
+
+ Revert "[Spark-1134] only call ipython if no arguments are given; remove IPYTHONOPTS from call"
+ Matei Zaharia <matei@databricks.com>
+ 2014-04-01 19:31:50 -0700
+ Commit: 45df912
+
+ [Spark-1134] only call ipython if no arguments are given; remove IPYTHONOPTS from call
+ Diana Carroll <dcarroll@cloudera.com>
+ 2014-04-01 19:29:26 -0700
+ Commit: afb5ea6, github.com/apache/spark/pull/227
+
+ [SPARK-1342] Scala 2.10.4
+ Mark Hamstra <markhamstra@gmail.com>
+ 2014-04-01 18:35:50 -0700
+ Commit: 764353d, github.com/apache/spark/pull/259
+
+ [SQL] SPARK-1372 Support for caching and uncaching tables in a SQLContext.
+ Michael Armbrust <michael@databricks.com>
+ 2014-04-01 14:45:44 -0700
+ Commit: f5c418d, github.com/apache/spark/pull/282
+
+ [Hot Fix #42] Persisted RDD disappears on storage page if re-used
+ Andrew Or <andrewor14@gmail.com>
+ 2014-03-31 23:01:14 -0700
+ Commit: ada310a, github.com/apache/spark/pull/281
+
+ [SPARK-1377] Upgrade Jetty to 8.1.14v20131031
+ Andrew Or <andrewor14@gmail.com>
+ 2014-03-31 21:42:36 -0700
+ Commit: 94fe7fd, github.com/apache/spark/pull/280
+
+ SPARK-1376. In the yarn-cluster submitter, rename "args" option to "arg"
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-04-01 08:26:31 +0530
+ Commit: 564f1c1, github.com/apache/spark/pull/279
+
+ SPARK-1365 [HOTFIX] Fix RateLimitedOutputStream test
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-31 16:25:43 -0700
+ Commit: 33b3c2a, github.com/apache/spark/pull/277
+
+ [SQL] Rewrite join implementation to allow streaming of one relation.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-31 15:23:46 -0700
+ Commit: 5731af5, github.com/apache/spark/pull/250
+
+ SPARK-1352: Improve robustness of spark-submit script
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-31 12:07:14 -0700
+ Commit: 841721e, github.com/apache/spark/pull/271
+
+ SPARK-1352 - Comment style single space before ending */ check.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-30 10:06:56 -0700
+ Commit: d666053, github.com/apache/spark/pull/261
+
+ [SPARK-1354][SQL] Add tableName as a qualifier for SimpleCatalog
+ jerryshao <saisai.shao@intel.com>
+ 2014-03-30 10:03:58 -0700
+ Commit: 95d7d2a, github.com/apache/spark/pull/272
+
+ SPARK-1336 Reducing the output of run-tests script.
+ Prashant Sharma <prashant.s@imaginea.com>, Prashant Sharma <scrapcodes@gmail.com>
+ 2014-03-29 23:03:03 -0700
+ Commit: df1b9f7, github.com/apache/spark/pull/262
+
+ [SQL] SPARK-1354 Fix self-joins of parquet relations
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-29 22:02:53 -0700
+ Commit: 2861b07, github.com/apache/spark/pull/269
+
+ Don't swallow all kryo errors, only those that indicate we are out of data.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-29 22:01:29 -0700
+ Commit: 92b8395, github.com/apache/spark/pull/142
+
+ [SPARK-1186] : Enrich the Spark Shell to support additional arguments.
+ Bernardo Gomez Palacio <bernardo.gomezpalacio@gmail.com>
+ 2014-03-29 19:49:22 -0700
+ Commit: fda86d8, github.com/apache/spark/pull/116
+
+ Implement the RLike & Like in catalyst
+ Cheng Hao <hao.cheng@intel.com>
+ 2014-03-29 15:12:43 -0700
+ Commit: af3746c, github.com/apache/spark/pull/224
+
+ SPARK-1126. spark-app preliminary
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-03-29 14:41:36 -0700
+ Commit: 1617816, github.com/apache/spark/pull/86
+
+ SPARK-1345 adding missing dependency on avro for hadoop 0.23 to the new ...
+ Thomas Graves <tgraves@apache.org>
+ 2014-03-28 23:09:29 -0700
+ Commit: 3738f24, github.com/apache/spark/pull/263
+
+ fix path for jar, make sed actually work on OSX
+ Nick Lanham <nick@afternight.org>
+ 2014-03-28 13:33:35 -0700
+ Commit: 75d46be, github.com/apache/spark/pull/264
+
+ SPARK-1096, a space after comment start style checker.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-28 00:21:49 -0700
+ Commit: 60abc25, github.com/apache/spark/pull/124
+
+ Make sed do -i '' on OSX
+ Nick Lanham <nick@afternight.org>
+ 2014-03-27 22:45:00 -0700
+ Commit: 632c322, github.com/apache/spark/pull/258
+
+ [SPARK-1210] Prevent ContextClassLoader of Actor from becoming ClassLoader of Executo...
+ Takuya UESHIN <ueshin@happy-camper.st>
+ 2014-03-27 22:17:15 -0700
+ Commit: 3d89043, github.com/apache/spark/pull/15
+
+ [SPARK-1268] Adding XOR and AND-NOT operations to spark.util.collection.BitSet
+ Petko Nikolov <nikolov@soundcloud.com>
+ 2014-03-27 15:49:07 -0700
+ Commit: 6f986f0, github.com/apache/spark/pull/172
+
+ SPARK-1335. Also increase perm gen / code cache for scalatest when invoked via Maven build
+ Sean Owen <sowen@cloudera.com>
+ 2014-03-27 11:49:11 -0700
+ Commit: 53953d0, github.com/apache/spark/pull/253
+
+ SPARK-1330 removed extra echo from comput_classpath.sh
+ Thomas Graves <tgraves@apache.org>
+ 2014-03-27 11:54:43 -0500
+ Commit: 426042a, github.com/apache/spark/pull/241
+
+ Cut down the granularity of travis tests.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-27 08:53:42 -0700
+ Commit: 5b2d863, github.com/apache/spark/pull/255
+
+ [SPARK-1327] GLM needs to check addIntercept for intercept and weights
+ Xiangrui Meng <meng@databricks.com>
+ 2014-03-26 19:30:20 -0700
+ Commit: d679843, github.com/apache/spark/pull/236
+
+ SPARK-1325. The maven build error for Spark Tools
+ Sean Owen <sowen@cloudera.com>, witgo <witgo@qq.com>
+ 2014-03-26 18:31:52 -0700
+ Commit: 1fa48d9, github.com/apache/spark/pull/240
+
+ Spark 1095 : Adding explicit return types to all public methods
+ NirmalReddy <nirmal_reddy2000@yahoo.com>, NirmalReddy <nirmal.reddy@imaginea.com>
+ 2014-03-26 18:24:55 -0700
+ Commit: 3e63d98, github.com/apache/spark/pull/168
+
+ SPARK-1324: SparkUI Should Not Bind to SPARK_PUBLIC_DNS
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-26 18:22:15 -0700
+ Commit: be6d96c, github.com/apache/spark/pull/231
+
+ [SQL] Add a custom serializer for maps since they do not have a no-arg constructor.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-26 18:19:49 -0700
+ Commit: e15e574, github.com/apache/spark/pull/243
+
+ [SQL] Un-ignore a test that is now passing.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-26 18:19:15 -0700
+ Commit: 32cbdfd, github.com/apache/spark/pull/244
+
+ Unified package definition format in Spark SQL
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-03-26 15:36:18 -0700
+ Commit: 345825d, github.com/apache/spark/pull/225
+
+ SPARK-1322, top in pyspark should sort result in descending order.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-26 09:16:37 -0700
+ Commit: a0853a3, github.com/apache/spark/pull/235
+
+ SPARK-1321 Use Guava's top k implementation rather than our BoundedPriorityQueue based implementation
+ Reynold Xin <rxin@apache.org>
+ 2014-03-26 00:09:44 -0700
+ Commit: b859853, github.com/apache/spark/pull/229
+
+ Initial experimentation with Travis CI configuration
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-25 19:01:18 -0700
+ Commit: 4f7d547, github.com/apache/spark/pull/230
+
+ Avoid Option while generating call site
+ witgo <witgo@qq.com>, Aaron Davidson <aaron@databricks.com>
+ 2014-03-25 13:28:13 -0700
+ Commit: 8237df8, github.com/apache/spark/pull/222
+
+ SPARK-1319: Fix scheduler to account for tasks using > 1 CPUs.
+ Shivaram Venkataraman <shivaram@eecs.berkeley.edu>
+ 2014-03-25 13:05:30 -0700
+ Commit: f8111ea, github.com/apache/spark/pull/219
+
+ SPARK-1316. Remove use of Commons IO
+ Sean Owen <sowen@cloudera.com>
+ 2014-03-25 10:21:25 -0700
+ Commit: 71d4ed2, github.com/apache/spark/pull/226
+
+ Add more hive compatibility tests to whitelist
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-25 09:57:26 -0700
+ Commit: 134ace7, github.com/apache/spark/pull/220
+
+ SPARK-1286: Make usage of spark-env.sh idempotent
+ Aaron Davidson <aaron@databricks.com>
+ 2014-03-24 22:24:21 -0700
+ Commit: 007a733, github.com/apache/spark/pull/184
+
+ Unify the logic for column pruning, projection, and filtering of table scans.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-24 22:15:51 -0700
+ Commit: b637f2d, github.com/apache/spark/pull/213
+
+ SPARK-1128: set hadoop task properties when constructing HadoopRDD
+ CodingCat <zhunansjtu@gmail.com>, Nan Zhu <CodingCat@users.noreply.github.com>
+ 2014-03-24 21:55:03 -0700
+ Commit: 5140598, github.com/apache/spark/pull/101
+
+ SPARK-1094 Support MiMa for reporting binary compatibility across versions.
+ Patrick Wendell <pwendell@gmail.com>, Prashant Sharma <prashant.s@imaginea.com>, Prashant Sharma <scrapcodes@gmail.com>
+ 2014-03-24 21:20:23 -0700
+ Commit: dc126f2, github.com/apache/spark/pull/207
+
+ SPARK-1294 Fix resolution of uppercase field names using a HiveContext.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-24 19:24:22 -0700
+ Commit: 8043b7b, github.com/apache/spark/pull/202
+
+ HOT FIX: Exclude test files from RAT
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-24 13:38:07 -0700
+ Commit: 56db8a2
+
+ SPARK-1144 Added license and RAT to check licenses.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-24 08:44:12 -0700
+ Commit: 21109fb, github.com/apache/spark/pull/125
+
+ [SPARK-1212] Adding sparse data support and update KMeans
+ Xiangrui Meng <meng@databricks.com>
+ 2014-03-23 17:34:02 -0700
+ Commit: 80c2968, github.com/apache/spark/pull/117
+
+ Fixed coding style issues in Spark SQL
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-03-23 15:21:40 -0700
+ Commit: 8265dc7, github.com/apache/spark/pull/208
+
+ [SPARK-1292] In-memory columnar representation for Spark SQL
+ Cheng Lian <lian@databricks.com>, Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-03-23 12:08:55 -0700
+ Commit: 57a4379, github.com/apache/spark/pull/205
+
+ SPARK-1254. Supplemental fix for HTTPS on Maven Central
+ Sean Owen <sowen@cloudera.com>
+ 2014-03-23 10:57:01 -0700
+ Commit: abf6714, github.com/apache/spark/pull/209
+
+ Fix to Stage UI to display numbers on progress bar
+ Emtiaz Ahmed <emtiazahmed@gmail.com>
+ 2014-03-21 18:05:53 -0700
+ Commit: 646e554, github.com/apache/spark/pull/201
+
+ Add asCode function for dumping raw tree representations.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-21 16:54:06 -0700
+ Commit: d780983, github.com/apache/spark/pull/200
+
+ Make SQL keywords case-insensitive
+ Matei Zaharia <matei@databricks.com>
+ 2014-03-21 16:53:18 -0700
+ Commit: dab5439, github.com/apache/spark/pull/193
+
+ SPARK-1279: Fix improper use of SimpleDateFormat
+ zsxwing <zsxwing@gmail.com>
+ 2014-03-21 16:07:22 -0700
+ Commit: 2c0aa22, github.com/apache/spark/pull/179
+
+ Add hive test files to repository. Remove download script.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-21 15:05:45 -0700
+ Commit: 7e17fe6, github.com/apache/spark/pull/199
+
+ Fix maven jenkins: Add explicit init for required tables in SQLQuerySuite
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-20 22:31:11 -0700
+ Commit: e09139d, github.com/apache/spark/pull/191
+
+ SPARK-1251 Support for optimizing and executing structured queries
+ Michael Armbrust <michael@databricks.com>, Yin Huai <huaiyin.thu@gmail.com>, Reynold Xin <rxin@apache.org>, Lian, Cheng <rhythm.mail@gmail.com>, Andre Schumacher <andre.schumacher@iki.fi>, Yin Huai <huai@cse.ohio-state.edu>, Timothy Chen <tnachen@gmail.com>, Cheng Lian <lian.cs.zju@gmail.com>, Timothy Chen <tnachen@apache.org>, Henry Cook <henry.m.cook+github@gmail.com>, Mark Hamstra <markhamstra@gmail.com>
+ 2014-03-20 18:03:20 -0700
+ Commit: 9aadcff, github.com/apache/spark/pull/146
+
+ [Hot Fix #42] Do not stop SparkUI if bind() is not called
+ Andrew Or <andrewor14@gmail.com>
+ 2014-03-20 14:13:16 -0700
+ Commit: ca76423, github.com/apache/spark/pull/188
+
+ Principal Component Analysis
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-03-20 10:39:20 -0700
+ Commit: 66a03e5, github.com/apache/spark/pull/88
+
+ Revert "SPARK-1099:Spark's local mode should probably respect spark.cores.max by default"
+ Aaron Davidson <aaron@databricks.com>
+ 2014-03-19 17:56:48 -0700
+ Commit: ffe272d
+
+ SPARK-1099:Spark's local mode should probably respect spark.cores.max by default
+ qqsun8819 <jin.oyj@alibaba-inc.com>
+ 2014-03-19 16:33:54 -0700
+ Commit: 1678931, github.com/apache/spark/pull/110
+
+ Added doctest for map function in rdd.py
+ Jyotiska NK <jyotiska123@gmail.com>
+ 2014-03-19 14:04:45 -0700
+ Commit: 67fa71c, github.com/apache/spark/pull/177
+
+ [SPARK-1132] Persisting Web UI through refactoring the SparkListener interface
+ Andrew Or <andrewor14@gmail.com>, andrewor14 <andrewor14@gmail.com>
+ 2014-03-19 13:17:01 -0700
+ Commit: 79d07d6, github.com/apache/spark/pull/42
+
+ Bugfixes/improvements to scheduler
+ Mridul Muralidharan <mridul@gmail.com>
+ 2014-03-19 12:46:55 -0700
+ Commit: ab747d3, github.com/apache/spark/pull/159
+
+ SPARK-1203 fix saving to hdfs from yarn
+ Thomas Graves <tgraves@apache.org>
+ 2014-03-19 08:09:20 -0500
+ Commit: 6112270, github.com/apache/spark/pull/173
+
+ bugfix: Wrong "Duration" in "Active Stages" in stages page
+ shiyun.wxm <shiyun.wxm@taobao.com>
+ 2014-03-19 01:42:34 -0700
+ Commit: d55ec86, github.com/apache/spark/pull/170
+
+ Bundle tachyon: SPARK-1269
+ Nick Lanham <nick@afternight.org>
+ 2014-03-18 22:04:57 -0700
+ Commit: a18ea00, github.com/apache/spark/pull/137
+
+ Fix SPARK-1256: Master web UI and Worker web UI returns a 404 error
+ witgo <witgo@qq.com>
+ 2014-03-18 21:57:47 -0700
+ Commit: cc2655a, github.com/apache/spark/pull/150
+
+ [SPARK-1266] persist factors in implicit ALS
+ Xiangrui Meng <meng@databricks.com>
+ 2014-03-18 17:20:42 -0700
+ Commit: f9d8a83, github.com/apache/spark/pull/165
+
+ [SPARK-1260]: faster construction of features with intercept
+ Xiangrui Meng <meng@databricks.com>
+ 2014-03-18 15:14:13 -0700
+ Commit: e108b9a, github.com/apache/spark/pull/161
+
+ Update copyright year in NOTICE to 2014
+ Matei Zaharia <matei@databricks.com>
+ 2014-03-18 14:34:31 -0700
+ Commit: 79e547f, github.com/apache/spark/pull/174
+
+ SPARK-1102: Create a saveAsNewAPIHadoopDataset method
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-03-18 11:06:18 -0700
+ Commit: 2fa26ec, github.com/apache/spark/pull/12
+
+ Revert "SPARK-1236 - Upgrade Jetty to 9.1.3.v20140225."
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-18 00:46:03 -0700
+ Commit: e7423d4, github.com/apache/spark/pull/167
+
+ Spark 1246 add min max to stat counter
+ Dan McClary <dan.mcclary@gmail.com>
+ 2014-03-18 00:45:47 -0700
+ Commit: e3681f2, github.com/apache/spark/pull/144
+
+ [Spark-1261] add instructions for running python examples to doc overview page
+ Diana Carroll <dcarroll@cloudera.com>
+ 2014-03-17 17:35:51 -0700
+ Commit: 087eedc, github.com/apache/spark/pull/162
+
+ SPARK-1244: Throw exception if map output status exceeds frame size
+ Patrick Wendell <pwendell@gmail.com>, Andrew Or <andrewor14@gmail.com>
+ 2014-03-17 14:03:32 -0700
+ Commit: 796977a, github.com/apache/spark/pull/152
+
+ SPARK-1240: handle the case of empty RDD when takeSample
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-03-16 22:14:59 -0700
+ Commit: dc96546, github.com/apache/spark/pull/135
+
+ SPARK-1255: Allow user to pass Serializer object instead of class name for shuffle.
+ Reynold Xin <rxin@apache.org>
+ 2014-03-16 09:57:21 -0700
+ Commit: f5486e9, github.com/apache/spark/pull/149
+
+ SPARK-1254. Consolidate, order, and harmonize repository declarations in Maven/SBT builds
+ Sean Owen <sowen@cloudera.com>
+ 2014-03-15 16:43:27 -0700
+ Commit: 97e4459, github.com/apache/spark/pull/145
+
+ Fix serialization of MutablePair. Also provide an interface for easy updating.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-14 11:40:26 -0700
+ Commit: e19044c, github.com/apache/spark/pull/141
+
+ [bugfix] wrong client arg, should use executor-cores
+ Tianshuo Deng <tdeng@twitter.com>
+ 2014-03-13 20:27:36 -0700
+ Commit: 181b130, github.com/apache/spark/pull/138
+
+ SPARK-1236 - Upgrade Jetty to 9.1.3.v20140225.
+ Reynold Xin <rxin@apache.org>
+ 2014-03-13 12:16:04 -0700
+ Commit: ca4bf8c, github.com/apache/spark/pull/113
+
+ SPARK-1183. Don't use "worker" to mean executor
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-03-13 12:11:33 -0700
+ Commit: 6983732, github.com/apache/spark/pull/120
+
+ [SPARK-1237, 1238] Improve the computation of YtY for implicit ALS
+ Xiangrui Meng <meng@databricks.com>
+ 2014-03-13 00:43:19 -0700
+ Commit: e4e8d8f, github.com/apache/spark/pull/131
+
+ SPARK-1019: pyspark RDD take() throws an NPE
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-12 23:16:59 -0700
+ Commit: 4ea23db, github.com/apache/spark/pull/112
+
+ hot fix for PR105 - change to Java annotation
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-03-12 19:49:18 -0700
+ Commit: 6bd2eaa, github.com/apache/spark/pull/133
+
+ Fix example bug: compile error
+ jianghan <jianghan@xiaomi.com>
+ 2014-03-12 19:46:12 -0700
+ Commit: 31a7040, github.com/apache/spark/pull/132
+
+ SPARK-1160: Deprecate toArray in RDD
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-03-12 17:43:12 -0700
+ Commit: 9032f7c, github.com/apache/spark/pull/105
+
+ SPARK-1162 Added top in python.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-12 15:57:44 -0700
+ Commit: b8afe30, github.com/apache/spark/pull/93
+
+ Fix #SPARK-1149 Bad partitioners can cause Spark to hang
+ liguoqiang <liguoqiang@rd.tuan800.com>
+ 2014-03-12 12:59:51 -0700
+ Commit: 5d1ec64, github.com/apache/spark/pull/44
+
+ [SPARK-1233] Fix running hadoop 0.23 due to java.lang.NoSuchFieldException: DEFAULT_M...
+ Thomas Graves <tgraves@apache.org>
+ 2014-03-12 11:25:41 -0700
+ Commit: b5162f4, github.com/apache/spark/pull/129
+
+ [SPARK-1232] Fix the hadoop 0.23 yarn build
+ Thomas Graves <tgraves@apache.org>
+ 2014-03-12 10:32:01 -0700
+ Commit: c8c59b3, github.com/apache/spark/pull/127
+
+ Spark-1163, Added missing Python RDD functions
+ prabinb <prabin.banka@imaginea.com>
+ 2014-03-11 23:57:05 -0700
+ Commit: af7f2f1, github.com/apache/spark/pull/92
+
+ SPARK-1064
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-03-11 22:39:17 -0700
+ Commit: 2409af9, github.com/apache/spark/pull/102
+
+ SPARK-1167: Remove metrics-ganglia from default build due to LGPL issues...
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-11 11:16:59 -0700
+ Commit: 16788a6, github.com/apache/spark/pull/108
+
+ SPARK-1211. In ApplicationMaster, set spark.master system property to "y...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-03-10 17:42:33 -0700
+ Commit: 2a2c964, github.com/apache/spark/pull/118
+
+ SPARK-1205: Clean up callSite/origin/generator.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-10 16:28:41 -0700
+ Commit: 2a51617, github.com/apache/spark/pull/106
+
+ SPARK-1168, Added foldByKey to pyspark.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-10 13:37:11 -0700
+ Commit: a59419c, github.com/apache/spark/pull/115
+
+ [SPARK-972] Added detailed callsite info for ValueError in context.py (resubmitted)
+ jyotiska <jyotiska123@gmail.com>
+ 2014-03-10 13:34:49 -0700
+ Commit: f551898, github.com/apache/spark/pull/34
+
+ SPARK-977 Added Python RDD.zip function
+ Prabin Banka <prabin.banka@imaginea.com>
+ 2014-03-10 13:27:00 -0700
+ Commit: e1e09e0, github.com/apache/spark/pull/76
+
+ maintain arbitrary state data for each key
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-03-09 22:42:12 -0700
+ Commit: 5d98cfc, github.com/apache/spark/pull/114
+
+ SPARK-782 Clean up for ASM dependency.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-09 13:17:07 -0700
+ Commit: b9be160, github.com/apache/spark/pull/100
+
+ Fix markup errors introduced in #33 (SPARK-1189)
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-09 11:57:06 -0700
+ Commit: faf4cad, github.com/apache/spark/pull/111
+
+ Add timeout for fetch file
+ Jiacheng Guo <guojc03@gmail.com>
+ 2014-03-09 11:37:44 -0700
+ Commit: f6f9d02, github.com/apache/spark/pull/98
+
+ SPARK-929: Fully deprecate usage of SPARK_MEM
+ Aaron Davidson <aaron@databricks.com>
+ 2014-03-09 11:08:39 -0700
+ Commit: 52834d7, github.com/apache/spark/pull/99
+
+ SPARK-1190: Do not initialize log4j if slf4j log4j backend is not being used
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-08 16:02:42 -0800
+ Commit: e59a3b6, github.com/apache/spark/pull/107
+
+ Update junitxml plugin to the latest version to avoid recompilation in every SBT command.
+ Reynold Xin <rxin@apache.org>
+ 2014-03-08 12:40:26 -0800
+ Commit: c2834ec, github.com/apache/spark/pull/104
+
+ [SPARK-1194] Fix the same-RDD rule for cache replacement
+ Cheng Lian <lian.cs.zju@gmail.com>
+ 2014-03-07 23:26:46 -0800
+ Commit: 0b7b7fd, github.com/apache/spark/pull/96
+
+ Allow sbt to use more than 1G of heap.
+ Reynold Xin <rxin@apache.org>
+ 2014-03-07 23:23:59 -0800
+ Commit: 8ad486a, github.com/apache/spark/pull/103
+
+ SPARK-1193. Fix indentation in pom.xmls
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-03-07 23:10:35 -0800
+ Commit: a99fb37, github.com/apache/spark/pull/91
+
+ Spark 1165 rdd.intersection in python and java
+ Prashant Sharma <prashant.s@imaginea.com>, Prashant Sharma <scrapcodes@gmail.com>
+ 2014-03-07 18:48:07 -0800
+ Commit: 6e730ed, github.com/apache/spark/pull/80
+
+ SPARK-1195: set map_input_file environment variable in PipedRDD
+ Thomas Graves <tgraves@apache.org>
+ 2014-03-07 10:36:55 -0800
+ Commit: b7cd9e9, github.com/apache/spark/pull/94
+
+ SPARK-1136: Fix FaultToleranceTest for Docker 0.8.1
+ Aaron Davidson <aaron@databricks.com>
+ 2014-03-07 10:22:27 -0800
+ Commit: dabeb6f, github.com/apache/spark/pull/5
+
+ Small clean-up to flatmap tests
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-06 17:57:31 -0800
+ Commit: 33baf14
+
+ Example for cassandra CQL read/write from spark
+ anitatailor <tailor.anita@gmail.com>
+ 2014-03-06 17:46:43 -0800
+ Commit: 9ae919c, github.com/apache/spark/pull/87
+
+ SPARK-1197. Change yarn-standalone to yarn-cluster and fix up running on YARN docs
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-03-06 17:12:58 -0800
+ Commit: 328c73d, github.com/apache/spark/pull/95
+
+ SPARK-1189: Add Security to Spark - Akka, Http, ConnectionManager, UI use servlets
+ Thomas Graves <tgraves@apache.org>
+ 2014-03-06 18:27:50 -0600
+ Commit: 7edbea4, github.com/apache/spark/pull/33
+
+ SPARK-942: Do not materialize partitions when DISK_ONLY storage level is used
+ Kyle Ellrott <kellrott@gmail.com>
+ 2014-03-06 14:51:00 -0800
+ Commit: 40566e1, github.com/apache/spark/pull/50
+
+ SPARK-1187, Added missing Python APIs
+ Prabin Banka <prabin.banka@imaginea.com>
+ 2014-03-06 12:45:27 -0800
+ Commit: 3d3acef, github.com/apache/spark/pull/75
+
+ SPARK-1156: allow user to login into a cluster without slaves
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-03-05 21:47:34 -0800
+ Commit: 3eb009f, github.com/apache/spark/pull/58
+
+ SPARK-1184: Update the distribution tar.gz to include spark-assembly jar
+ Mark Grover <mark@apache.org>
+ 2014-03-05 16:52:58 -0800
+ Commit: cda381f, github.com/apache/spark/pull/78
+
+ Improve building with maven docs
+ liguoqiang <liguoqiang@rd.tuan800.com>
+ 2014-03-05 16:38:43 -0800
+ Commit: 51ca7bd, github.com/apache/spark/pull/70
+
+ SPARK-1171: when executor is removed, we should minus totalCores instead of just freeCores on that executor
+ CodingCat <zhunansjtu@gmail.com>, Nan Zhu <CodingCat@users.noreply.github.com>
+ 2014-03-05 14:00:28 -0800
+ Commit: a3da508, github.com/apache/spark/pull/63
+
+ SPARK-1109 wrong API docs for pyspark map function
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-04 15:32:43 -0800
+ Commit: 0283665, github.com/apache/spark/pull/73
+
+ SPARK-1178: missing document of spark.scheduler.revive.interval
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-03-04 10:28:17 -0800
+ Commit: 1865dd6, github.com/apache/spark/pull/74
+
+ SPARK-1164 Deprecated reduceByKeyToDriver as it is an alias for reduceByKeyLocally
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-04 10:27:02 -0800
+ Commit: 2d8e0a0, github.com/apache/spark/pull/72
+
+ [java8API] SPARK-964 Investigate the potential for using JDK 8 lambda expressions for the Java/Scala APIs
+ Prashant Sharma <prashant.s@imaginea.com>, Patrick Wendell <pwendell@gmail.com>
+ 2014-03-03 22:31:30 -0800
+ Commit: 181ec50, github.com/apache/spark/pull/17
+
+ Remove broken/unused Connection.getChunkFIFO method.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-03-03 21:27:18 -0800
+ Commit: b14ede7, github.com/apache/spark/pull/69
+
+ SPARK-1158: Fix flaky RateLimitedOutputStreamSuite.
+ Reynold Xin <rxin@apache.org>
+ 2014-03-03 21:24:19 -0800
+ Commit: f5ae38a, github.com/apache/spark/pull/55
+
+ Added a unit test for PairRDDFunctions.lookup
+ Bryn Keller <bryn.keller@intel.com>
+ 2014-03-03 16:38:57 -0800
+ Commit: 923dba5, github.com/apache/spark/pull/36
+
+ Remove the remoteFetchTime metric.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-03-03 16:12:00 -0800
+ Commit: b55cade, github.com/apache/spark/pull/62
+
+ update proportion of memory
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-03-03 14:41:25 -0800
+ Commit: 9d225a9, github.com/apache/spark/pull/66
+
+ Removed accidentally checked in comment
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-03-03 14:39:49 -0800
+ Commit: 369aad6, github.com/apache/spark/pull/61
+
+ SPARK-1173. (#2) Fix typo in Java streaming example.
+ Aaron Kimball <aaron@magnify.io>
+ 2014-03-02 23:48:48 -0800
+ Commit: f65c1f3, github.com/apache/spark/pull/65
+
+ SPARK-1173. Improve scala streaming docs.
+ Aaron Kimball <aaron@magnify.io>
+ 2014-03-02 23:26:47 -0800
+ Commit: 2b53447, github.com/apache/spark/pull/64
+
+ Add Jekyll tag to isolate "production-only" doc components.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-02 18:19:01 -0800
+ Commit: 55a4f11, github.com/apache/spark/pull/56
+
+ SPARK-1121: Include avro for yarn-alpha builds
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-02 15:18:19 -0800
+ Commit: c3f5e07, github.com/apache/spark/pull/49
+
+ SPARK-1084.2 (resubmitted)
+ Sean Owen <sowen@cloudera.com>
+ 2014-03-02 14:27:53 -0800
+ Commit: fd31adb, github.com/apache/spark/pull/32
+
+ Ignore RateLimitedOutputStreamSuite for now.
+ Reynold Xin <rxin@apache.org>
+ 2014-03-02 14:27:19 -0800
+ Commit: 353ac6b, github.com/apache/spark/pull/54
+
+ SPARK-1137: Make ZK PersistenceEngine not crash for wrong serialVersionUID
+ Aaron Davidson <aaron@databricks.com>
+ 2014-03-02 01:00:42 -0800
+ Commit: 46bcb95, github.com/apache/spark/pull/4
+
+ Remove remaining references to incubation
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-02 01:00:16 -0800
+ Commit: 1fd2bfd, github.com/apache/spark/pull/51
+
+ Update io.netty from 4.0.13 Final to 4.0.17.Final
+ Binh Nguyen <ngbinh@gmail.com>, Binh Nguyen <ngbinh@gmail.com>
+ 2014-03-02 00:48:50 -0800
+ Commit: b70823c, github.com/apache/spark/pull/41
+
+ Merge the old sbt-launch-lib.bash with the new sbt-launcher jar downloading logic.
+ Michael Armbrust <michael@databricks.com>
+ 2014-03-02 00:35:23 -0800
+ Commit: 012bd5f, github.com/apache/spark/pull/14
+
+ Initialized the regVal for first iteration in SGD optimizer
+ DB Tsai <dbtsai@alpinenow.com>
+ 2014-03-02 00:31:59 -0800
+ Commit: 6fc76e4, github.com/apache/spark/pull/40
+
+ [SPARK-1100] prevent Spark from overwriting directory silently
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-03-01 17:27:54 -0800
+ Commit: 3a8b698, github.com/apache/spark/pull/11
+
+ [SPARK-1150] fix repo location in create script (re-open)
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-03-01 17:24:53 -0800
+ Commit: fe195ae, github.com/apache/spark/pull/52
+
+ Revert "[SPARK-1150] fix repo location in create script"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-01 17:15:38 -0800
+ Commit: ec992e1
+
+ [SPARK-1150] fix repo location in create script
+ Mark Grover <mark@apache.org>
+ 2014-03-01 16:21:22 -0800
+ Commit: 9aa0957, github.com/apache/spark/pull/48
+
+ [SPARK-979] Randomize order of offers.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-03-01 11:24:22 -0800
+ Commit: 556c566, github.com/apache/spark/pull/27
+
+ SPARK-1151: Update dev merge script to use spark.git instead of incubator-spark
+ Thomas Graves <tgraves@apache.org>
+ 2014-02-28 18:28:33 -0800
+ Commit: 4ba3f70, github.com/apache/spark/pull/47
+
+ SPARK-1051. On YARN, executors don't doAs submitting user
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-02-28 12:43:01 -0600
+ Commit: 46dff34, github.com/apache/spark/pull/29
+
+ SPARK-1032. If Yarn app fails before registering, app master stays aroun...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-02-28 09:40:47 -0600
+ Commit: 5f419bf, github.com/apache/spark/pull/28
+
+ Remove BlockFetchTracker trait
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-02-27 21:52:55 -0800
+ Commit: edf8a56, github.com/apache/spark/pull/39
+
+ Removed reference to incubation in Spark user docs.
+ Reynold Xin <rxin@apache.org>
+ 2014-02-27 21:13:22 -0800
+ Commit: 40e080a, github.com/apache/spark/pull/2
+
+ [HOTFIX] Patching maven build after #6 (SPARK-1121).
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-02-27 15:06:20 -0800
+ Commit: c42557b, github.com/apache/spark/pull/37
+
+ SPARK 1084.1 (resubmitted)
+ Sean Owen <sowen@cloudera.com>
+ 2014-02-27 11:12:21 -0800
+ Commit: 12bbca2, github.com/apache/spark/pull/31
+
+ Show Master status on UI page
+ Raymond Liu <raymond.liu@intel.com>
+ 2014-02-26 23:51:32 -0800
+ Commit: aace2c0, github.com/apache/spark/pull/24
+
+ [SPARK-1089] fix the regression problem on ADD_JARS in 0.9
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-02-26 23:42:15 -0800
+ Commit: 345df5f, github.com/apache/spark/pull/13
+
+ SPARK-1121 Only add avro if the build is for Hadoop 0.23.X and SPARK_YARN is set
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-02-26 23:40:49 -0800
+ Commit: 6ccd6c5, github.com/apache/spark/pull/6
+
+ SPARK-1129: use a predefined seed when seed is zero in XORShiftRandom
+ Xiangrui Meng <meng@databricks.com>
+ 2014-02-26 23:22:30 -0800
+ Commit: 5a3ad10, github.com/apache/spark/pull/645
+
+ Remove references to ClusterScheduler (SPARK-1140)
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-02-26 22:52:42 -0800
+ Commit: 71f69d6, github.com/apache/spark/pull/9
+
+ Updated link for pyspark examples in docs
+ Jyotiska NK <jyotiska123@gmail.com>
+ 2014-02-26 21:37:04 -0800
+ Commit: 2645035, github.com/apache/spark/pull/22
+
+ Deprecated and added a few java api methods for corresponding scala api.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-02-26 21:17:44 -0800
+ Commit: 0e40e2b, github.com/apache/spark/pull/19
+
+ Removed reference to incubation in README.md.
+ Reynold Xin <rxin@apache.org>
+ 2014-02-26 16:52:26 -0800
+ Commit: 84f7ca1, github.com/apache/spark/pull/1
+
+ SPARK-1115: Catch depickling errors
+ Bouke van der Bijl <boukevanderbijl@gmail.com>
+ 2014-02-26 14:50:37 -0800
+ Commit: 12738c1, github.com/apache/spark/pull/644
+
+ SPARK-1135: fix broken anchors in docs
+ Matei Zaharia <matei@databricks.com>
+ 2014-02-26 11:20:16 -0800
+ Commit: c86eec5, github.com/apache/spark/pull/3
+
+ SPARK-1078: Replace lift-json with json4s-jackson.
+ William Benton <willb@redhat.com>
+ 2014-02-26 10:09:50 -0800
+ Commit: fbedc8e, github.com/apache/spark/pull/582
+
+ SPARK-1053. Don't require SPARK_YARN_APP_JAR
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-02-26 10:00:02 -0600
+ Commit: b8a1871, github.com/apache/spark/pull/553
+
+ For SPARK-1082, Use Curator for ZK interaction in standalone cluster
+ Raymond Liu <raymond.liu@intel.com>
+ 2014-02-24 23:20:38 -0800
+ Commit: c852201, github.com/apache/incubator-spark/pull/611
+
+ Graph primitives2
+ Semih Salihoglu <semihsalihoglu@gmail.com>
+ 2014-02-24 22:42:30 -0800
+ Commit: 1f4c7f7, github.com/apache/incubator-spark/pull/580
+
+ Include reference to twitter/chill in tuning docs
+ Andrew Ash <andrew@andrewash.com>
+ 2014-02-24 21:13:38 -0800
+ Commit: a4f4fbc, github.com/apache/incubator-spark/pull/647
+
+ For outputformats that are Configurable, call setConf before sending data to them.
+ Bryn Keller <bryn.keller@intel.com>
+ 2014-02-24 17:35:22 -0800
+ Commit: 4d88030, github.com/apache/incubator-spark/pull/638
+
+ d8d190e 2014-02-24 16:58:57 -0800
+ Merge pull request #641 from mateiz/spark-1124-master
+ [SPARK-1124: Fix infinite retries of reduce stage when a map stage failed]
+
+ Fix removal from shuffleToMapStage to search for a key-value pair with our stage instead of using our shuffleID.
+ Matei Zaharia <matei@databricks.com>
+ 2014-02-24 13:14:56 -0800
+ Commit: 0187cef
+
+ SPARK-1124: Fix infinite retries of reduce stage when a map stage failed
+ Matei Zaharia <matei@databricks.com>
+ 2014-02-23 23:45:48 -0800
+ Commit: cd32d5e
+
+ SPARK-1071: Tidy logging strategy and use of log4j
+ Sean Owen <sowen@cloudera.com>
+ 2014-02-23 11:40:55 -0800
+ Commit: c0ef3af, github.com/apache/incubator-spark/pull/570
+
+ [SPARK-1041] remove dead code in start script, remind user to set that in spark-env.sh
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-02-22 20:21:15 -0800
+ Commit: 437b62f, github.com/apache/incubator-spark/pull/588
+
+ Migrate Java code to Scala or move it to src/main/java
+ Punya Biswal <pbiswal@palantir.com>
+ 2014-02-22 17:53:48 -0800
+ Commit: 29ac7ea, github.com/apache/incubator-spark/pull/605
+
+ [SPARK-1055] fix the SCALA_VERSION and SPARK_VERSION in docker file
+ CodingCat <zhunansjtu@gmail.com>, Nan Zhu <CodingCat@users.noreply.github.com>
+ 2014-02-22 15:39:25 -0800
+ Commit: 1aa4f8a, github.com/apache/incubator-spark/pull/634
+
+ doctest updated for mapValues, flatMapValues in rdd.py
+ jyotiska <jyotiska123@gmail.com>
+ 2014-02-22 15:10:31 -0800
+ Commit: 722199f, github.com/apache/incubator-spark/pull/621
+
+ Fixed minor typo in worker.py
+ jyotiska <jyotiska123@gmail.com>
+ 2014-02-22 10:09:50 -0800
+ Commit: 3ff077d, github.com/apache/incubator-spark/pull/630
+
+ SPARK-1117: update accumulator docs
+ Xiangrui Meng <meng@databricks.com>
+ 2014-02-21 22:44:45 -0800
+ Commit: aaec7d4, github.com/apache/incubator-spark/pull/631
+
+ [SPARK-1113] External spilling - fix Int.MaxValue hash code collision bug
+ Andrew Or <andrewor14@gmail.com>
+ 2014-02-21 20:05:39 -0800
+ Commit: fefd22f, github.com/apache/incubator-spark/pull/624
+
+ MLLIB-25: Implicit ALS runs out of memory for moderately large numbers of features
+ Sean Owen <sowen@cloudera.com>
+ 2014-02-21 12:46:12 -0800
+ Commit: c8a4c9b, github.com/apache/incubator-spark/pull/629
+
+ SPARK-1111: URL Validation Throws Error for HDFS URL's
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-02-21 11:11:55 -0800
+ Commit: 45b15e2, github.com/apache/incubator-spark/pull/625
+
+ SPARK-1114: Allow PySpark to use existing JVM and Gateway
+ Ahir Reddy <ahirreddy@gmail.com>
+ 2014-02-20 21:20:39 -0800
+ Commit: 59b1379, github.com/apache/incubator-spark/pull/622
+
+ Super minor: Add require for mergeCombiners in combineByKey
+ Aaron Davidson <aaron@databricks.com>
+ 2014-02-20 16:46:13 -0800
+ Commit: 3fede48, github.com/apache/incubator-spark/pull/623
+
+ MLLIB-22. Support negative implicit input in ALS
+ Sean Owen <sowen@cloudera.com>
+ 2014-02-19 23:44:53 -0800
+ Commit: 9e63f80, github.com/apache/incubator-spark/pull/500
+
+ MLLIB-24: url of "Collaborative Filtering for Implicit Feedback Datasets" in ALS is invalid now
+ Chen Chao <crazyjvm@gmail.com>
+ 2014-02-19 22:06:35 -0800
+ Commit: f9b7d64, github.com/apache/incubator-spark/pull/619
+
+ [SPARK-1105] fix site scala version error in docs
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-02-19 15:54:03 -0800
+ Commit: 7b012c9, github.com/apache/incubator-spark/pull/618
+
+ SPARK-1106: check key name and identity file before launch a cluster
+ Xiangrui Meng <meng@databricks.com>
+ 2014-02-18 18:30:02 -0800
+ Commit: b61435c, github.com/apache/incubator-spark/pull/617
+
+ Revert "[SPARK-1105] fix site scala version error in doc"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-02-18 17:46:47 -0800
+ Commit: d9bb32a
+
+ [SPARK-1105] fix site scala version error in doc
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-02-18 16:29:23 -0800
+ Commit: d99773d, github.com/apache/incubator-spark/pull/616
+
+ Optimized imports
+ NirmalReddy <nirmal.reddy@imaginea.com>, NirmalReddy <nirmal_reddy2000@yahoo.com>
+ 2014-02-18 14:44:36 -0800
+ Commit: ccb327a, github.com/apache/incubator-spark/pull/613
+
+ SPARK-1098: Minor cleanup of ClassTag usage in Java API
+ Aaron Davidson <aaron@databricks.com>
+ 2014-02-17 19:23:27 -0800
+ Commit: f74ae0e, github.com/apache/incubator-spark/pull/604
+
+ [SPARK-1090] improvement on spark_shell (help information, configure memory)
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-02-17 15:12:52 -0800
+ Commit: e0d49ad, github.com/apache/incubator-spark/pull/599
+
+ Fix typos in Spark Streaming programming guide
+ Andrew Or <andrewor14@gmail.com>
+ 2014-02-17 10:59:02 -0800
+ Commit: 767e3ae, github.com/apache/incubator-spark/pull/536
+
+ Worker registration logging fix
+ Andrew Ash <andrew@andrewash.com>
+ 2014-02-17 09:51:55 -0800
+ Commit: c0795cf, github.com/apache/incubator-spark/pull/608
+
+ Add subtractByKey to the JavaPairRDD wrapper
+ Punya Biswal <pbiswal@palantir.com>
+ 2014-02-16 18:55:59 -0800
+ Commit: 5af4477, github.com/apache/incubator-spark/pull/600
+
+ fix for https://spark-project.atlassian.net/browse/SPARK-1052
+ Bijay Bisht <bijay.bisht@gmail.com>
+ 2014-02-16 16:52:57 -0800
+ Commit: 73cfdcf, github.com/apache/incubator-spark/pull/568
+
+ [SPARK-1092] print warning information if user use SPARK_MEM to regulate executor memory usage
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-02-16 12:25:38 -0800
+ Commit: 1cad381, github.com/apache/incubator-spark/pull/602
+
+ Typo: Standlone -> Standalone
+ Andrew Ash <andrew@andrewash.com>
+ 2014-02-14 10:01:01 -0800
+ Commit: eec4bd1, github.com/apache/incubator-spark/pull/601
+
+ 2414ed3 2014-02-13 14:26:06 -0800
+ Merge pull request #598 from shivaram/master.
+ [Update spark_ec2 to use 0.9.0 by default]
+
+ Add c3 instance types to Spark EC2
+ Christian Lundgren <christian.lundgren@gameanalytics.com>
+ 2014-02-13 12:44:21 -0800
+ Commit: 5fa53c0, github.com/apache/incubator-spark/pull/595
+
+ Ported hadoopClient jar for < 1.0.1 fix
+ Bijay Bisht <bijay.bisht@gmail.com>
+ 2014-02-12 23:42:10 -0800
+ Commit: a3bb861, github.com/apache/incubator-spark/pull/584
+
+ SPARK-1073 Keep GitHub pull request title as commit summary
+ Andrew Ash <andrew@andrewash.com>
+ 2014-02-12 23:23:06 -0800
+ Commit: 6ee0ad8, github.com/apache/incubator-spark/pull/574
+
+ 7fe7a55 2014-02-12 22:35:09 -0800
+ Merge pull request #592 from rxin/test.
+ [SPARK-1088: Create a script for running tests so we can have version specific testing on Jenkins.]
+
+ 7e29e02 2014-02-12 16:26:25 -0800
+ Merge pull request #591 from mengxr/transient-new.
+ [SPARK-1076: [Fix #578] add @transient to some vals]
+
+ 2bea070 2014-02-12 10:47:52 -0800
+ Merge pull request #589 from mengxr/index.
+ [SPARK-1076: Convert Int to Long to avoid overflow]
+
+ e733d65 2014-02-12 00:42:42 -0800
+ Merge pull request #578 from mengxr/rank.
+ [SPARK-1076: zipWithIndex and zipWithUniqueId to RDD]
+
+ 68b2c0d 2014-02-11 22:39:48 -0800
+ Merge pull request #583 from colorant/zookeeper.
+ [Minor fix for ZooKeeperPersistenceEngine to use configured working dir]
+
+ b0dab1b 2014-02-11 14:48:59 -0800
+ Merge pull request #571 from holdenk/switchtobinarysearch.
+ [SPARK-1072 Use binary search when needed in RangePartitioner]
+
+ ba38d98 2014-02-11 14:46:22 -0800
+ Merge pull request #577 from hsaputra/fix_simple_streaming_doc.
+ [SPARK-1075 Fix doc in the Spark Streaming custom receiver closing bracket in the class constructor]
+
+ 4afe6cc 2014-02-10 22:28:39 -0800
+ Merge pull request #579 from CrazyJvm/patch-1.
+ ["in the source DStream" rather than "int the source DStream"]
+
+ d6a9bdc 2014-02-09 23:35:06 -0800
+ Revert "Merge pull request #560 from pwendell/logging. Closes #560."
+ [This reverts commit b6d40b782327188a25ded5b22790552121e5271f.]
+
+ 919bd7f 2014-02-09 22:17:52 -0800
+ Merge pull request #567 from ScrapCodes/style2.
+ [SPARK-1058, Fix Style Errors and Add Scala Style to Spark Build. Pt 2]
+
+ 2182aa3 2014-02-09 15:19:50 -0800
+ Merge pull request #566 from martinjaggi/copy-MLlib-d.
+ [new MLlib documentation for optimization, regression and classification]
+
+ afc8f3c 2014-02-09 13:57:29 -0800
+ Merge pull request #551 from qqsun8819/json-protocol.
+ [[SPARK-1038] Add more fields in JsonProtocol and add tests that verify the JSON itself]
+
+ 94ccf86 2014-02-09 13:54:27 -0800
+ Merge pull request #569 from pwendell/merge-fixes.
+ [Fixes bug where merges won't close associated pull request.]
+
+ b69f8b2 2014-02-09 10:09:19 -0800
+ Merge pull request #557 from ScrapCodes/style. Closes #557.
+ [SPARK-1058, Fix Style Errors and Add Scala Style to Spark Build.]
+
+ b6dba10 2014-02-08 23:39:17 -0800
+ Merge pull request #556 from CodingCat/JettyUtil. Closes #556.
+ [[SPARK-1060] startJettyServer should explicitly use IP information]
+
+ 2ef37c9 2014-02-08 23:36:48 -0800
+ Merge pull request #562 from jyotiska/master. Closes #562.
+ [Added example Python code for sort]
+
+ b6d40b7 2014-02-08 23:35:31 -0800
+ Merge pull request #560 from pwendell/logging. Closes #560.
+ [[WIP] SPARK-1067: Default log4j initialization causes errors for those not using log4j]
+
+ f892da8 2014-02-08 23:13:34 -0800
+ Merge pull request #565 from pwendell/dev-scripts. Closes #565.
+ [SPARK-1066: Add developer scripts to repository.]
+
+ c2341c9 2014-02-08 16:00:43 -0800
+ Merge pull request #542 from markhamstra/versionBump. Closes #542.
+ [Version number to 1.0.0-SNAPSHOT]
+
+ f0ce736 2014-02-08 12:59:48 -0800
+ Merge pull request #561 from Qiuzhuang/master. Closes #561.
+ [Kill drivers in postStop() for Worker.]
+
+ 7805080 2014-02-08 12:24:08 -0800
+ Merge pull request #454 from jey/atomic-sbt-download. Closes #454.
+ [Make sbt download an atomic operation]
+
+ fabf174 2014-02-08 11:39:13 -0800
+ Merge pull request #552 from martinjaggi/master. Closes #552.
+ [tex formulas in the documentation]
+
+ 3a9d82c 2014-02-06 22:38:36 -0800
+ Merge pull request #506 from ash211/intersection. Closes #506.
+ [SPARK-1062 Add rdd.intersection(otherRdd) method]
+
+ 1896c6e 2014-02-06 22:05:53 -0800
+ Merge pull request #533 from andrewor14/master. Closes #533.
+ [External spilling - generalize batching logic]
+
+ 0b448df 2014-02-06 16:15:24 -0800
+ Merge pull request #450 from kayousterhout/fetch_failures. Closes #450.
+ [Only run ResubmitFailedStages event after a fetch fails]
+
+ 18ad59e 2014-02-06 16:10:48 -0800
+ Merge pull request #321 from kayousterhout/ui_kill_fix. Closes #321.
+ [Inform DAG scheduler about all started/finished tasks.]
+
+ 446403b 2014-02-06 15:41:16 -0800
+ Merge pull request #554 from sryza/sandy-spark-1056. Closes #554.
+ [SPARK-1056. Fix header comment in Executor to not imply that it's only u...]
+
+ 084839b 2014-02-06 14:58:35 -0800
+ Merge pull request #498 from ScrapCodes/python-api. Closes #498.
+ [Python api additions]
+
+ 79c9552 2014-02-05 23:38:12 -0800
+ Merge pull request #545 from kayousterhout/fix_progress. Closes #545.
+ [Fix off-by-one error with task progress info log.]
+
+ 3802096 2014-02-05 23:37:07 -0800
+ Merge pull request #526 from tgravescs/yarn_client_stop_am_fix. Closes #526.
+ [spark on yarn - yarn-client mode doesn't always exit immediately]
+
+ 18c4ee7 2014-02-05 22:08:47 -0800
+ Merge pull request #549 from CodingCat/deadcode_master. Closes #549.
+ [remove actorToWorker in master.scala, which is actually not used]
+
+ cc14ba9 2014-02-05 12:44:24 -0800
+ Merge pull request #544 from kayousterhout/fix_test_warnings. Closes #544.
+ [Fixed warnings in test compilation.]
+
+ f7fd80d 2014-02-05 10:29:45 -0800
+ Merge pull request #540 from sslavic/patch-3. Closes #540.
+ [Fix line end character stripping for Windows]
+
+ 9209287 2014-02-04 09:47:11 -0800
+ Merge pull request #534 from sslavic/patch-1. Closes #534.
+ [Fixed wrong path to compute-classpath.cmd]
+
+ 0c05cd3 2014-02-04 09:45:46 -0800
+ Merge pull request #535 from sslavic/patch-2. Closes #535.
+ [Fixed typo in scaladoc]
+
+ 23af00f 2014-02-03 13:02:09 -0800
+ Merge pull request #528 from mengxr/sample. Closes #528.
+ [ Refactor RDD sampling and add randomSplit to RDD (update)]
+
+ 1625d8c 2014-02-03 11:25:39 -0800
+ Merge pull request #530 from aarondav/cleanup. Closes #530.
+ [Remove explicit conversion to PairRDDFunctions in cogroup()]
+
+ 0386f42 2014-02-02 21:51:17 -0800
+ Merge pull request #529 from hsaputra/cleanup_right_arrowop_scala
+ [Change the ⇒ character (maybe from scalariform) to => in Scala code for style consistency]
+
+ a8cf3ec 2014-01-31 16:52:02 -0800
+ Merge pull request #527 from ankurdave/graphx-assembly-pom
+ [Add GraphX to assembly/pom.xml]
+
+ ac712e4 2014-01-30 09:33:18 -0800
+ Merge pull request #524 from rxin/doc
+ [Added spark.shuffle.file.buffer.kb to configuration doc.]
+
+ 0ff38c2 2014-01-29 12:44:54 -0800
+ Merge pull request #494 from tyro89/worker_registration_issue
+ [Issue with failed worker registrations]
+
+ 7930209 2014-01-28 21:51:05 -0800
+ Merge pull request #497 from tdas/docs-update
+ [Updated Spark Streaming Programming Guide]
+
+ f8c742c 2014-01-28 21:30:20 -0800
+ Merge pull request #523 from JoshRosen/SPARK-1043
+ [Switch from MUTF8 to UTF8 in PySpark serializers.]
+
+ Switch from MUTF8 to UTF8 in PySpark serializers.
+ Josh Rosen <joshrosen@apache.org>
+ 2014-01-28 19:50:26 -0800
+ Commit: 1381fc7
+
+ 84670f2 2014-01-27 17:08:35 -0800
+ Merge pull request #466 from liyinan926/file-overwrite-new
+ [Allow files added through SparkContext.addFile() to be overwritten]
+
+ 3d5c03e 2014-01-27 16:27:01 -0800
+ Merge pull request #516 from sarutak/master
+ [modified SparkPluginBuild.scala to use https protocol for accessing gith...]
+
+ f16c21e 2014-01-27 14:24:06 -0800
+ Merge pull request #490 from hsaputra/modify_checkoption_with_isdefined
+ [Replace the check for None Option with isDefined and isEmpty in Scala code]
+
+ f67ce3e 2014-01-27 11:15:51 -0800
+ Merge pull request #460 from srowen/RandomInitialALSVectors
+ [Choose initial user/item vectors uniformly on the unit sphere]
+
+ modified SparkPluginBuild.scala to use https protocol for accessing github.
+ sarutak <sarutak@oss.nttdata.co.jp>
+ 2014-01-27 17:00:26 +0900
+ Commit: 6a5af7b
+
+ c40619d 2014-01-25 22:41:30 -0800
+ Merge pull request #504 from JoshRosen/SPARK-1025
+ [Fix PySpark hang when input files are deleted (SPARK-1025)]
+
+ c66a2ef 2014-01-25 22:36:07 -0800
+ Merge pull request #511 from JoshRosen/SPARK-1040
+ [Fix ClassCastException in JavaPairRDD.collectAsMap() (SPARK-1040)]
+
+ Fix ClassCastException in JavaPairRDD.collectAsMap() (SPARK-1040)
+ Josh Rosen <joshrosen@apache.org>
+ 2014-01-25 16:39:20 -0800
+ Commit: 740e865
+
+ Increase JUnit test verbosity under SBT.
+ Josh Rosen <joshrosen@apache.org>
+ 2014-01-25 16:32:44 -0800
+ Commit: 531d9d7
+
+ 05be704 2014-01-23 20:53:18 -0800
+ Merge pull request #505 from JoshRosen/SPARK-1026
+ [Deprecate mapPartitionsWithSplit in PySpark (SPARK-1026)]
+
+ Deprecate mapPartitionsWithSplit in PySpark.
+ Josh Rosen <joshrosen@apache.org>
+ 2014-01-23 20:01:36 -0800
+ Commit: 4cebb79
+
+ 3d6e754 2014-01-23 19:47:00 -0800
+ Merge pull request #503 from pwendell/master
+ [Fix bug on read-side of external sort when using Snappy.]
+
+ Minor fix
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-23 19:23:12 -0800
+ Commit: ff44732
+
+ c319617 2014-01-23 19:11:59 -0800
+ Merge pull request #502 from pwendell/clone-1
+ [Remove Hadoop object cloning and warn users making Hadoop RDD's.]
+
+ cad3002 2014-01-23 19:08:34 -0800
+ Merge pull request #501 from JoshRosen/cartesian-rdd-fixes
+ [Fix two bugs in PySpark cartesian(): SPARK-978 and SPARK-1034]
+
+ Minor changes after auditing diff from earlier version
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-23 18:30:11 -0800
+ Commit: 268ecbd
+
+ Fix for SPARK-1025: PySpark hang on missing files.
+ Josh Rosen <joshrosen@apache.org>
+ 2014-01-23 18:10:16 -0800
+ Commit: f830684
+
+ Response to Matei's review
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-23 18:12:40 -0800
+ Commit: c58d4ea
+
+ Fix bug on read-side of external sort when using Snappy.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-23 17:59:42 -0800
+ Commit: 0213b40
+
+ Remove Hadoop object cloning and warn users making Hadoop RDD's.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-23 13:30:54 -0800
+ Commit: 7101017
+
+ Fix SPARK-978: ClassCastException in PySpark cartesian.
+ Josh Rosen <joshrosen@apache.org>
+ 2014-01-23 15:09:19 -0800
+ Commit: 6156990
+
+ Fix SPARK-1034: Py4JException on PySpark Cartesian Result
+ Josh Rosen <joshrosen@apache.org>
+ 2014-01-23 13:05:59 -0800
+ Commit: 0035dbb
+
+ fad6aac 2014-01-23 11:14:15 -0800
+ Merge pull request #406 from eklavya/master
+ [Extending Java API coverage]
+
+ a2b47da 2014-01-23 10:48:26 -0800
+ Merge pull request #499 from jianpingjwang/dev1
+ [Replace commons-math with jblas in SVDPlusPlus]
+
+ fixed ClassTag in mapPartitions
+ eklavya <sr.eklavya@gmail.com>
+ 2014-01-23 17:40:36 +0530
+ Commit: 60e7457
+
+ Add jblas dependency
+ Jianping J Wang <jianping.j.wang@gmail.com>
+ 2014-01-23 19:54:01 +0800
+ Commit: 19a01c1
+
+ Add jblas dependency
+ Jianping J Wang <jianping.j.wang@gmail.com>
+ 2014-01-23 19:48:39 +0800
+ Commit: a5a513e
+
+ Replace commons-math with jblas
+ Jianping J Wang <jianping.j.wang@gmail.com>
+ 2014-01-23 19:44:30 +0800
+ Commit: cc0fd33
+
+ a1cd185 2014-01-22 19:37:29 -0800
+ Merge pull request #496 from pwendell/master
+ [Fix bug in worker clean-up in UI]
+
+ 034dce2 2014-01-22 18:58:02 -0800
+ Merge pull request #447 from CodingCat/SPARK-1027
+ [fix for SPARK-1027]
+
+ Fix bug in worker clean-up in UI
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-22 18:19:46 -0800
+ Commit: 6285513
+
+ refactor sparkHome to val
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-01-22 19:32:51 -0500
+ Commit: 2b3c461
+
+ 3184fac 2014-01-22 15:45:04 -0800
+ Merge pull request #495 from srowen/GraphXCommonsMathDependency
+ [Fix graphx Commons Math dependency]
+
+ Also add graphx commons-math3 dependency in sbt build
+ Sean Owen <sowen@cloudera.com>
+ 2014-01-22 22:40:41 +0000
+ Commit: 4476398
+
+ a1238bb 2014-01-22 14:32:59 -0800
+ Merge pull request #492 from skicavs/master
+ [fixed job name and usage information for the JavaSparkPi example]
+
+ Depend on Commons Math explicitly instead of accidentally getting it from Hadoop (which stops working in 2.2.x) and also use the newer commons-math3
+ Sean Owen <sowen@cloudera.com>
+ 2014-01-22 22:25:49 +0000
+ Commit: fd0c5b8
+
+ 576c4a4 2014-01-22 14:10:07 -0800
+ Merge pull request #478 from sryza/sandy-spark-1033
+ [SPARK-1033. Ask for cores in Yarn container requests]
+
+ 5bcfd79 2014-01-22 14:05:48 -0800
+ Merge pull request #493 from kayousterhout/double_add
+ [Fixed bug where task set managers are added to queue twice]
+
+ d009b17 2014-01-22 14:01:30 -0800
+ Merge pull request #315 from rezazadeh/sparsesvd
+ [Sparse SVD]
+
+ Fixed bug where task set managers are added to queue twice
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-01-22 09:49:31 -0800
+ Commit: 19da82c
+
+ fixed job name and usage information for the JavaSparkPi example
+ Kevin Mader <kevinmader@gmail.com>
+ 2014-01-22 15:58:23 +0100
+ Commit: 36f9a64
+
+ Replace the code to check for Option != None with Option.isDefined call in Scala code.
+ Henry Saputra <hsaputra@apache.org>
+ 2014-01-21 23:22:10 -0800
+ Commit: 90ea9d5
+
+ 749f842 2014-01-21 14:53:49 -0800
+ Merge pull request #489 from ash211/patch-6
+ [Clarify spark.default.parallelism]
+
+ Clarify spark.default.parallelism
+ Andrew Ash <andrew@andrewash.com>
+ 2014-01-21 14:49:35 -0800
+ Commit: 069bb94
+
+ f854498 2014-01-21 10:49:54 -0800
+ Merge pull request #469 from ajtulloch/use-local-spark-context-in-tests-for-mllib
+ [[MLlib] Use a LocalSparkContext trait in test suites]
+
+ Fixed import order
+ Andrew Tulloch <andrew@tullo.ch>
+ 2014-01-21 13:34:59 +0000
+ Commit: 3a067b4
+
+ Incorporate Tom's comments - update doc and code to reflect that core requests may not always be honored
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-01-21 00:38:02 -0800
+ Commit: adf4261
+
+ 77b986f 2014-01-21 00:09:42 -0800
+ Merge pull request #480 from pwendell/0.9-fixes
+ [Handful of 0.9 fixes]
+
+ Style clean-up
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-20 23:42:24 -0800
+ Commit: a9bcc98
+
+ c67d3d8 2014-01-20 23:34:35 -0800
+ Merge pull request #484 from tdas/run-example-fix
+ [Made run-example respect SPARK_JAVA_OPTS and SPARK_MEM.]
+
+ Removed SPARK_MEM from run-examples.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-01-20 23:15:28 -0800
+ Commit: 65869f8
+
+ Adding small code comment
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-20 23:11:45 -0800
+ Commit: a917a87
+
+ 6b4eed7 2014-01-20 22:35:45 -0800
+ Merge pull request #449 from CrazyJvm/master
+ [SPARK-1028 : fix "set MASTER automatically fails" bug.]
+
+ 0367981 2014-01-20 22:25:50 -0800
+ Merge pull request #482 from tdas/streaming-example-fix
+ [Added StreamingContext.awaitTermination to streaming examples]
+
+ 7373ffb 2014-01-20 21:44:29 -0800
+ Merge pull request #483 from pwendell/gitignore
+ [Restricting /lib to top level directory in .gitignore]
+
+ Made run-example respect SPARK_JAVA_OPTS and SPARK_MEM.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-01-20 20:48:59 -0800
+ Commit: e0b741d
+
+ Restricting /lib to top level directory in .gitignore
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-20 20:39:10 -0800
+ Commit: e437069
+
+ Added StreamingContext.awaitTermination to streaming examples.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-01-20 20:25:04 -0800
+ Commit: 2e95174
+
+ Avoid matching attempt files in the checkpoint
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-20 20:02:02 -0800
+ Commit: d46df96
+
+ Remove shuffle files if they are still present on a machine.
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-20 19:11:22 -0800
+ Commit: de526ad
+
+ Fixing speculation bug
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-20 19:05:03 -0800
+ Commit: f84400e
+
+ Force use of LZF when spilling data
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-20 19:00:48 -0800
+ Commit: c324ac1
+
+ Bug fix for reporting of spill output
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-20 18:34:00 -0800
+ Commit: 1b29914
+
+ Minor fixes
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-20 18:33:21 -0800
+ Commit: 54867e9
+
+ Removing docs on akka options
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-20 16:35:26 -0800
+ Commit: cdb003e
+
+ SPARK-1033. Ask for cores in Yarn container requests
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-01-19 10:16:25 -0800
+ Commit: 3e85b87
+
+ fix for SPARK-1027
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-01-15 20:46:14 -0500
+ Commit: 29f4b6a
+
+ executor creation failed should not make the worker restart
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-01-15 19:32:50 -0500
+ Commit: f9a95d6
+
+ 792d908 2014-01-19 11:33:11 -0800
+ Merge pull request #470 from tgravescs/fix_spark_examples_yarn
+ [Only log error on missing jar to allow spark examples to jar.]
+
+ 256a355 2014-01-19 10:29:54 -0800
+ Merge pull request #458 from tdas/docs-update
+ [Updated java API docs for streaming, along with very minor changes in the code examples.]
+
+ update comment
+ Thomas Graves <tgraves@apache.org>
+ 2014-01-19 12:21:39 -0600
+ Commit: dd56b21
+
+ Only log error on missing jar to allow spark examples to jar.
+ Thomas Graves <tgraves@apache.org>
+ 2014-01-19 12:16:58 -0600
+ Commit: ceb79a3
+
+ LocalSparkContext for MLlib
+ Andrew Tulloch <andrew@tullo.ch>
+ 2014-01-19 17:51:00 +0000
+ Commit: 720836a
+
+ Addressed comments from Reynold
+ Yinan Li <liyinan926@gmail.com>
+ 2014-01-18 21:28:17 -0800
+ Commit: 584323c
+
+ fe8a354 2014-01-18 16:29:23 -0800
+ Merge pull request #459 from srowen/UpdaterL2Regularization
+ [Correct L2 regularized weight update with canonical form]
+
+ 73dfd42 2014-01-18 16:23:56 -0800
+ Merge pull request #437 from mridulm/master
+ [Minor api usability changes]
+
+ 4c16f79 2014-01-18 16:21:43 -0800
+ Merge pull request #426 from mateiz/py-ml-tests
+ [Re-enable Python MLlib tests (require Python 2.7 and NumPy 1.7+)]
+
+ bf56995 2014-01-18 16:17:34 -0800
+ Merge pull request #462 from mateiz/conf-file-fix
+ [Remove Typesafe Config usage and conf files to fix nested property names]
+
+ Allow files added through SparkContext.addFile() to be overwritten
+ Yinan Li <liyinan926@gmail.com>
+ 2014-01-17 17:27:25 -0800
+ Commit: fd833e7
+
+ aa981e4 2014-01-18 12:49:21 -0800
+ Merge pull request #461 from pwendell/master
+ [Use renamed shuffle spill config in CoGroupedRDD.scala]
+
+ Use renamed shuffle spill config in CoGroupedRDD.scala
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-18 11:55:10 -0800
+ Commit: 5316bca
+
+ Correct L2 regularized weight update with canonical form
+ Sean Owen <sowen@cloudera.com>
+ 2014-01-18 12:53:01 +0000
+ Commit: e91ad3f
+
+ rename to MatrixSVD
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-17 14:40:51 -0800
+ Commit: 85b95d0
+
+ rename to MatrixSVD
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-17 14:39:30 -0800
+ Commit: fa32998
+
+ Merge remote-tracking branch 'upstream/master' into sparsesvd
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-17 14:34:03 -0800
+ Commit: caf97a2
+
+ make example 0-indexed
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-17 14:33:03 -0800
+ Commit: 4e96757
+
+ 0index docs
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-17 14:31:39 -0800
+ Commit: 5c639d7
+
+ prettify
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-17 14:14:29 -0800
+ Commit: c9b4845
+
+ add rename computeSVD
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-17 13:59:05 -0800
+ Commit: dbec69b
+
+ replace this.type with SVD
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-17 13:57:27 -0800
+ Commit: eb2d8c4
+
+ use 0-indexing
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-17 13:55:42 -0800
+ Commit: cb13b15
+
+ changes from PR
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-17 13:39:40 -0800
+ Commit: d28bf41
+
+ Address review comment
+ Mridul Muralidharan <mridul@gmail.com>
+ 2014-01-17 18:28:55 +0530
+ Commit: b690e11
+
+ d749d47 2014-01-16 23:18:15 -0800
+ Merge pull request #451 from Qiuzhuang/master
+ [Fixed Window spark shell launch script error.]
+
+ d4fd89e 2014-01-16 23:17:30 -0800
+ Merge pull request #438 from ScrapCodes/clone-records-java-api
+ [Clone records java api]
+
+ adding clone records field to equivalent java apis
+ Prashant Sharma <scrapcodes@gmail.com>
+ 2014-01-14 20:13:55 +0530
+ Commit: fcb4fc6
+
+ Updated java API docs for streaming, along with very minor changes in the code examples.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-01-16 14:44:02 -0800
+ Commit: 11e6534
+
+ Use method, not variable
+ Mridul Muralidharan <mridul@gmail.com>
+ 2014-01-16 17:26:42 +0530
+ Commit: edd82c5
+
+ Address review comments
+ Mridul Muralidharan <mridul@gmail.com>
+ 2014-01-16 17:23:25 +0530
+ Commit: 1a0da89
+
+ Fixed Window spark shell launch script error. JIRA SPARK-1029:https://spark-project.atlassian.net/browse/SPARK-1029
+ Qiuzhuang Lian <Qiuzhuang.Lian@gmail.com>
+ 2014-01-16 16:09:10 +0800
+ Commit: 4e510b0
+
+ c06a307 2014-01-15 23:47:25 -0800
+ Merge pull request #445 from kayousterhout/exec_lost
+ [Fail rather than hanging if a task crashes the JVM.]
+
+ Updated unit test comment
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-01-15 23:46:14 -0800
+ Commit: 718a13c
+
+ 84595ea 2014-01-15 20:15:29 -0800
+ Merge pull request #414 from soulmachine/code-style
+ [Code clean up for mllib]
+
+ fix some format problem.
+ CrazyJvm <crazyjvm@gmail.com>
+ 2014-01-16 11:57:46 +0800
+ Commit: 8400536
+
+ fix "set MASTER automatically fails" bug.
+ CrazyJvm <crazyjvm@gmail.com>
+ 2014-01-16 11:45:02 +0800
+ Commit: 7a0c5b5
+
+ 0675ca5 2014-01-15 16:09:03 -0800
+ Merge pull request #439 from CrazyJvm/master
+ [SPARK-1024 Remove "-XX:+UseCompressedStrings" option from tuning guide]
+
+ Fail rather than hanging if a task crashes the JVM.
+ Kay Ousterhout <kayousterhout@gmail.com>
+ 2014-01-15 16:03:40 -0800
+ Commit: a268d63
+
+ 4f0c361 2014-01-15 14:25:45 -0800
+ Merge pull request #444 from mateiz/py-version
+ [Clarify that Python 2.7 is only needed for MLlib]
+
+ Clarify that Python 2.7 is only needed for MLlib
+ Matei Zaharia <matei@databricks.com>
+ 2014-01-15 14:20:39 -0800
+ Commit: 2ffdaef
+
+ 59f475c 2014-01-15 13:55:14 -0800
+ Merge pull request #442 from pwendell/standalone
+ [Workers should use working directory as spark home if it's not specified]
+
+ 2a05403 2014-01-15 13:54:45 -0800
+ Merge pull request #443 from tdas/filestream-fix
+ [Made some classes private[streaming] and deprecated a method in JavaStreamingContext.]
+
+ Made some classes private[streaming] and deprecated a method in JavaStreamingContext.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-01-15 12:15:46 -0800
+ Commit: 9e63753
+
+ 5fecd25 2014-01-15 11:15:07 -0800
+ Merge pull request #441 from pwendell/graphx-build
+ [GraphX shouldn't list Spark as provided.]
+
+ Workers should use working directory as spark home if it's not specified
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-15 10:58:02 -0800
+ Commit: 00a3f7e
+
+ GraphX shouldn't list Spark as provided
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-15 10:44:17 -0800
+ Commit: 9259d70
+
+ 494d3c0 2014-01-15 10:00:50 -0800
+ Merge pull request #433 from markhamstra/debFix
+ [Updated Debian packaging]
+
+ cef2af9 2014-01-15 10:06:17 -0600
+ Merge pull request #366 from colorant/yarn-dev
+ [More yarn code refactor]
+
+ remove "-XX:+UseCompressedStrings" option
+ CrazyJvm <crazyjvm@gmail.com>
+ 2014-01-15 22:26:15 +0800
+ Commit: 263933d
+
+ 3d9e66d 2014-01-14 23:17:05 -0800
+ Merge pull request #436 from ankurdave/VertexId-case
+ [Rename VertexID -> VertexId in GraphX]
+
+ Expose method and class - so that we can use it from user code (particularly since checkpoint directory is autogenerated now)
+ Mridul Muralidharan <mridul@gmail.com>
+ 2014-01-15 12:44:44 +0530
+ Commit: 0aea33d
+
+ 139c24e 2014-01-14 23:07:55 -0800
+ Merge pull request #435 from tdas/filestream-fix
+ [Fixed the flaky tests by making SparkConf not serializable]
+
+ 087487e 2014-01-14 22:50:36 -0800
+ Merge pull request #434 from rxin/graphxmaven
+ [Fixed SVDPlusPlusSuite in Maven build.]
+
+ Merge remote-tracking branch 'apache/master' into filestream-fix
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-01-14 22:21:20 -0800
+ Commit: 0e15bd7
+
+ Changed SparkConf to not be serializable. And also fixed unit-test log paths in log4j.properties of external modules.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-01-14 22:20:14 -0800
+ Commit: 1f4718c
+
+ Fixed SVDPlusPlusSuite in Maven build.
+ Reynold Xin <rxin@apache.org>
+ 2014-01-14 22:18:43 -0800
+ Commit: dfb1524
+
+ Removed repl-bin and updated maven build doc.
+ Mark Hamstra <markhamstra@gmail.com>
+ 2014-01-14 21:36:58 -0800
+ Commit: 147a943
+
+ VertexID -> VertexId
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-01-14 22:17:18 -0800
+ Commit: f4d9019
+
+ Add deb profile to assembly/pom.xml
+ Mark Hamstra <markhamstra@gmail.com>
+ 2014-01-14 21:23:09 -0800
+ Commit: 148757e
+
+ 3a386e2 2014-01-14 21:52:50 -0800
+ Merge pull request #424 from jegonzal/GraphXProgrammingGuide
+ [Additional edits for clarity in the graphx programming guide.]
+
+ ad294db 2014-01-14 21:51:06 -0800
+ Merge pull request #431 from ankurdave/graphx-caching-doc
+ [Describe caching and uncaching in GraphX programming guide]
+
+ Describe GraphX caching and uncaching in guide
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-01-14 17:24:25 -0800
+ Commit: 1210ec2
+
+ 74b46ac 2014-01-14 14:59:13 -0800
+ Merge pull request #428 from pwendell/writeable-objects
+ [Don't clone records for text files]
+
+ 193a075 2014-01-14 14:53:24 -0800
+ Merge pull request #429 from ankurdave/graphx-examples-pom.xml
+ [Add GraphX dependency to examples/pom.xml]
+
+ d601a76 2014-01-14 14:52:24 -0800
+ Merge pull request #427 from pwendell/deprecate-aggregator
+ [Deprecate rather than remove old combineValuesByKey function]
+
+ Add GraphX dependency to examples/pom.xml
+ Ankur Dave <ankurdave@gmail.com>
+ 2014-01-14 13:57:51 -0800
+ Commit: 8ea056d
+
+ Style fix
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-14 13:56:27 -0800
+ Commit: b1b22b7
+
+ Adding fix covering combineCombinersByKey as well
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-14 13:52:23 -0800
+ Commit: 8ea2cd5
+
+ 2ce23a5 2014-01-14 13:28:44 -0800
+ Merge pull request #425 from rxin/scaladoc
+ [API doc update & make Broadcast public]
+
+ Complain if Python and NumPy versions are too old for MLlib
+ Matei Zaharia <matei@databricks.com>
+ 2014-01-14 12:27:58 -0800
+ Commit: 5b3a3e2
+
+ Deprecate rather than remove old combineValuesByKey function
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-14 12:15:10 -0800
+ Commit: b683608
+
+ Re-enable Python MLlib tests (require Python 2.7 and NumPy 1.7+)
+ Matei Zaharia <matei@databricks.com>
+ 2014-01-14 12:14:48 -0800
+ Commit: 938e4a0
+
+ Don't clone records for text files
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-14 11:57:53 -0800
+ Commit: 6f965a4
+
+ Fixed a typo in JavaSparkContext's API doc.
+ Reynold Xin <rxin@apache.org>
+ 2014-01-14 11:42:28 -0800
+ Commit: f12e506
+
+ Maintain Serializable API compatibility by reverting back to java.io.Serializable for Broadcast and Accumulator.
+ Reynold Xin <rxin@apache.org>
+ 2014-01-14 11:30:59 -0800
+ Commit: 1b5623f
+
+ Added license header for package.scala in the Java API package.
+ Reynold Xin <rxin@apache.org>
+ 2014-01-14 11:20:12 -0800
+ Commit: 55db774
+
+ Added package doc for the Java API.
+ Reynold Xin <rxin@apache.org>
+ 2014-01-14 11:16:25 -0800
+ Commit: f8c12e9
+
+ Updated API doc for Accumulable and Accumulator.
+ Reynold Xin <rxin@apache.org>
+ 2014-01-14 11:16:08 -0800
+ Commit: 6a12b9e
+
+ Broadcast variable visibility change & doc update.
+ Reynold Xin <rxin@apache.org>
+ 2014-01-14 11:15:21 -0800
+ Commit: 71b3007
+
+ Additional edits for clarity in the graphx programming guide.
+ Joseph E. Gonzalez <joseph.e.gonzalez@gmail.com>
+ 2014-01-14 10:31:43 -0800
+ Commit: 0bba773
+
+ 3fcc68b 2014-01-14 09:44:43 -0800
+ Merge pull request #423 from jegonzal/GraphXProgrammingGuide
+ [Improving the graphx-programming-guide]
+
+ Improving the graphx-programming-guide.
+ Joseph E. Gonzalez <joseph.e.gonzalez@gmail.com>
+ 2014-01-14 09:40:06 -0800
+ Commit: 486f37c
+
+ Added parentheses for that getDouble() also has side effect
+ Frank Dai <soulmachine@gmail.com>
+ 2014-01-14 18:56:11 +0800
+ Commit: 57fcfc7
+
+ fa75e5e 2014-01-14 01:18:34 -0800
+ Merge pull request #420 from pwendell/header-files
+ [Add missing header files]
+
+ Add missing header files
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-01-14 01:14:20 -0800
+ Commit: 2303479
+
+ Modifications as suggested in PR feedback-
+ Saurabh Rawat <sr.eklavya@gmail.com>
+ 2014-01-14 14:19:02 +0530
+ Commit: 1442cd5
+
+ Merge remote-tracking branch 'upstream/master' into sparsesvd
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-13 23:52:34 -0800
+ Commit: 845e568
+
+ Merge remote-tracking branch 'upstream/master' into code-style
+ Frank Dai <soulmachine@gmail.com>
+ 2014-01-14 15:29:17 +0800
+ Commit: a3da468
+
+ Indent two spaces
+ Frank Dai <soulmachine@gmail.com>
+ 2014-01-14 14:59:01 +0800
+ Commit: c2852cf
+
+ Since getLong() and getInt() have side effect, get back parentheses, and remove an empty line
+ Frank Dai <soulmachine@gmail.com>
+ 2014-01-14 14:53:10 +0800
+ Commit: 12386b3
+
+ Code clean up for mllib
+ Frank Dai <soulmachine@gmail.com>
+ 2014-01-14 14:37:26 +0800
+ Commit: 0d94d74
+
+ Address comments to fix code formats
+ Raymond Liu <raymond.liu@intel.com>
+ 2014-01-10 09:44:44 +0800
+ Commit: 4c22c55
+
+ Yarn workerRunnable refactor
+ Raymond Liu <raymond.liu@intel.com>
+ 2014-01-09 14:16:07 +0800
+ Commit: 161ab93
+
+ Yarn Client refactor
+ Raymond Liu <raymond.liu@intel.com>
+ 2014-01-09 09:53:50 +0800
+ Commit: 79a5ba3
+
+ Modifications as suggested in PR feedback-
+ Saurabh Rawat <sr.eklavya@gmail.com>
+ 2014-01-13 23:40:04 +0530
+ Commit: e922973
+
+ Remove default param from mapPartitions
+ eklavya <sr.eklavya@gmail.com>
+ 2014-01-13 18:13:22 +0530
+ Commit: fa42951
+
+ Remove classtag from mapPartitions.
+ eklavya <sr.eklavya@gmail.com>
+ 2014-01-13 18:09:58 +0530
+ Commit: 8fe562c
+
+ Added foreachPartition method to JavaRDD.
+ eklavya <sr.eklavya@gmail.com>
+ 2014-01-13 17:56:47 +0530
+ Commit: 6a65fee
+
+ Added mapPartitions method to JavaRDD.
+ eklavya <sr.eklavya@gmail.com>
+ 2014-01-13 17:56:10 +0530
+ Commit: dbadc6b
+
+ Added setter method setGenerator to JavaRDD.
+ eklavya <sr.eklavya@gmail.com>
+ 2014-01-13 17:53:35 +0530
+ Commit: aae8a01
+
+ Merge remote-tracking branch 'upstream/master' into sparsesvd
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-11 13:27:15 -0800
+ Commit: f324d53
+
+ add dimension parameters to example
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-10 21:30:54 -0800
+ Commit: 1afdeae
+
+ Merge remote-tracking branch 'upstream/master' into sparsesvd
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-09 22:45:32 -0800
+ Commit: 21c8a54
+
+ fix example
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-09 22:39:41 -0800
+ Commit: cf5bd4a
+
+ documentation for sparsematrix
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-07 17:19:28 -0800
+ Commit: 4f38b6f
+
+ More sparse matrix usage.
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-07 17:16:17 -0800
+ Commit: 7d7490b
+
+ fix docs to use SparseMatrix
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-05 18:03:57 -0800
+ Commit: 746148b
+
+ use SparseMatrix everywhere
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-04 14:28:07 -0800
+ Commit: 06c0f76
+
+ prettify
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-04 12:44:04 -0800
+ Commit: cdff9fc
+
+ new example file
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-04 12:33:22 -0800
+ Commit: e9bd6cb
+
+ fix tests
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-04 11:52:42 -0800
+ Commit: 8bfcce1
+
+ set methods
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-04 11:30:36 -0800
+ Commit: 35adc72
+
+ add k parameter
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-04 01:52:28 -0800
+ Commit: 73daa70
+
+ using decomposed matrix struct now
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-04 00:38:53 -0800
+ Commit: 26a74f0
+
+ new return struct
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-04 00:15:04 -0800
+ Commit: d2d5e5e
+
+ start using matrixentry
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-03 22:17:24 -0800
+ Commit: 7f631dd
+
+ rename sparsesvd.scala
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-03 21:55:38 -0800
+ Commit: 6bcdb76
+
+ New matrix entry file
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-03 21:54:57 -0800
+ Commit: b059a2a
+
+ fix error message
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-02 01:51:38 -0800
+ Commit: e617ae2
+
+ Merge remote-tracking branch 'upstream/master' into sparsesvd
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-02 01:50:30 -0800
+ Commit: 6140578
+
+ more docs yay
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-01 20:22:29 -0800
+ Commit: 2612164
+
+ javadoc for sparsesvd
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-01 20:20:16 -0800
+ Commit: 915d53f
+
+ old version of spark_ec2
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-01 20:08:01 -0800
+ Commit: c868d71
+
+ remove accidental changes to ec2 script
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-01 20:05:03 -0800
+ Commit: 0c3797d
+
+ doc tweaks
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-01 20:03:47 -0800
+ Commit: 53ccf65
+
+ doc tweak
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-01 20:02:37 -0800
+ Commit: 97dc527
+
+ doc tweaks
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-01 20:01:13 -0800
+ Commit: b941b6f
+
+ tweaks to docs
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-01 19:53:14 -0800
+ Commit: 185c882
+
+ New documentation
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-01 19:53:04 -0800
+ Commit: dd0d3f0
+
+ Merge remote-tracking branch 'upstream/master' into sparsesvd
+ Reza Zadeh <rizlar@gmail.com>
+ 2014-01-01 18:12:35 -0800
+ Commit: 7c04b31
+
+ large scale considerations
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-27 04:15:13 -0500
+ Commit: ae5102a
+
+ initial large scale testing begin
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-27 01:51:19 -0500
+ Commit: 642ab5c
+
+ cleanup documentation
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-27 00:41:46 -0500
+ Commit: 3369c2d
+
+ add all tests
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-27 00:36:41 -0500
+ Commit: bdb5037
+
+ test for truncated svd
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-27 00:34:59 -0500
+ Commit: fa1e8d8
+
+ full rank matrix test added
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-26 23:21:57 -0500
+ Commit: 16de526
+
+ Main method added for svd
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-26 18:13:21 -0500
+ Commit: fe1a132
+
+ new main file
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-26 18:09:33 -0500
+ Commit: 1a21ba2
+
+ Object to hold the svd methods
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-26 17:39:25 -0500
+ Commit: 6c3674c
+
+ Some documentation
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-26 16:12:40 -0500
+ Commit: 6e740cc
+
+ Initial files - no tests
+ Reza Zadeh <rizlar@gmail.com>
+ 2013-12-26 15:01:03 -0500
+ Commit: 1a173f0
+
+
+Release 0.9.1
+
+ Revert "[maven-release-plugin] prepare release v0.9.1-rc2"
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-26 21:53:07 -0700
+ Commit: ea5da04
+
+ Revert "[maven-release-plugin] prepare for next development iteration"
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-26 21:51:40 -0700
+ Commit: d16e863
+
+ [SPARK-1327] GLM needs to check addIntercept for intercept and weights
+ Xiangrui Meng <meng@databricks.com>
+ 2014-03-26 19:30:57 -0700
+ Commit: 4901604, github.com/apache/spark/pull/236
+
+ SPARK-1322, top in pyspark should sort result in descending order.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-26 11:15:02 -0700
+ Commit: 2f90dc5, github.com/apache/spark/pull/235
+
+ [maven-release-plugin] prepare for next development iteration
+ Ubuntu <ubuntu@ip-172-31-18-245.us-west-2.compute.internal>
+ 2014-03-26 09:26:45 +0000
+ Commit: 1f785d4
+
+ [maven-release-plugin] prepare release v0.9.1-rc2
+ Ubuntu <ubuntu@ip-172-31-18-245.us-west-2.compute.internal>
+ 2014-03-26 09:26:40 +0000
+ Commit: 1197280
+
+ Updated CHANGES.txt
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-26 02:10:57 -0700
+ Commit: 7495dba
+
+ [SPARK-782] Made Spark use existing shaded ASM and removed Spark's ASM dependency
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-25 21:35:36 -0700
+ Commit: da87240, github.com/apache/spark/pull/232
+
+ Revert "[maven-release-plugin] prepare release v0.9.1-rc1"
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-25 15:01:52 -0700
+ Commit: 55abe72
+
+ Revert "[maven-release-plugin] prepare for next development iteration"
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-25 15:01:36 -0700
+ Commit: b94f997
+
+ [maven-release-plugin] prepare for next development iteration
+ Ubuntu <ubuntu@ip-172-31-18-245.us-west-2.compute.internal>
+ 2014-03-24 06:56:16 +0000
+ Commit: 12e237e
+
+ [maven-release-plugin] prepare release v0.9.1-rc1
+ Ubuntu <ubuntu@ip-172-31-18-245.us-west-2.compute.internal>
+ 2014-03-24 06:56:10 +0000
+ Commit: 81c6a06
+
+ Removed all occurrences of incubator from all the pom.xml.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-23 23:31:59 -0700
+ Commit: 60ddb34
+
+ Updated CHANGES.txt file.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-23 13:16:50 -0700
+ Commit: f176b03
+
+ Fix to Stage UI to display numbers on progress bar
+ Emtiaz Ahmed <emtiazahmed@gmail.com>
+ 2014-03-21 18:07:05 -0700
+ Commit: 5e7ac0d, github.com/apache/spark/pull/201
+
+ SPARK-1284: Fix improper use of SimpleDateFormat
+ zsxwing <zsxwing@gmail.com>
+ 2014-03-21 16:39:23 -0700
+ Commit: 8856076, github.com/apache/spark/pull/179
+
+ [SPARK-1273] use doi links in mllib-guide
+ Xiangrui Meng <meng@databricks.com>
+ 2014-03-21 14:35:32 -0700
+ Commit: d68549e, github.com/apache/spark/pull/198
+
+ Removed incubating from Spark version in all the pom.xml.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-20 18:02:55 -0700
+ Commit: 8b1e793
+
+ Bumped versions to Spark 0.9.1
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-20 16:55:35 -0700
+ Commit: 8a882ef, github.com/apache/spark/pull/190
+
+ SPARK-1032. If Yarn app fails before registering, app master stays aroun...
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-03-20 16:50:44 -0500
+ Commit: c6630d3, github.com/apache/spark/pull/28
+
+ SPARK-1051. On YARN, executors don't doAs submitting user
+ Sandy Ryza <sandy@cloudera.com>
+ 2014-03-20 14:48:05 -0500
+ Commit: 748f002, github.com/apache/spark/pull/29
+
+ [SPARK-1285] Backporting updates to streaming docs to branch 0.9
+ Aaron Kimball <aaron@magnify.io>, Tathagata Das <tathagata.das1565@gmail.com>, Chen Chao <crazyjvm@gmail.com>, Andrew Or <andrewor14@gmail.com>
+ 2014-03-20 12:27:47 -0700
+ Commit: 1e36690, github.com/apache/spark/pull/183
+
+ [SPARK-1273] MLlib bug fixes, improvements, and doc updates for v0.9.1
+ Xiangrui Meng <meng@databricks.com>, Sean Owen <sowen@cloudera.com>, Andrew Tulloch <andrew@tullo.ch>, Chen Chao <crazyjvm@gmail.com>
+ 2014-03-19 19:05:26 -0700
+ Commit: 1cc979e, github.com/apache/spark/pull/175
+
+ [SPARK-1275] Made dev/run-tests executable.
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-19 16:10:45 -0700
+ Commit: a4eef65, github.com/apache/spark/pull/178
+
+ Update the yarn alpha version to 0.9.1-incubating-SNAPSHOT
+ Thomas Graves <tgraves@apache.org>
+ 2014-03-19 12:41:11 -0500
+ Commit: 72875b2
+
+ SPARK-1203 fix saving to hdfs from yarn
+ Thomas Graves <tgraves@apache.org>
+ 2014-03-19 08:19:47 -0500
+ Commit: 250ec27, github.com/apache/spark/pull/173
+
+ bugfix: Wrong "Duration" in "Active Stages" in stages page
+ shiyun.wxm <shiyun.wxm@taobao.com>
+ 2014-03-19 01:42:42 -0700
+ Commit: d385b5a, github.com/apache/spark/pull/170
+
+ [SPARK-1274] Add dev scripts to merge PRs and create releases from master to branch-0.9
+ Tathagata Das <tathagata.das1565@gmail.com>
+ 2014-03-18 22:09:16 -0700
+ Commit: 7ec78bc, github.com/apache/spark/pull/176
+
+ Bundle tachyon: SPARK-1269
+ Nick Lanham <nick@afternight.org>
+ 2014-03-18 22:05:18 -0700
+ Commit: 0183ddd, github.com/apache/spark/pull/137
+
+ [Spark-1261] add instructions for running python examples to doc overview page
+ Diana Carroll <dcarroll@cloudera.com>
+ 2014-03-17 17:37:03 -0700
+ Commit: 20d9458, github.com/apache/spark/pull/162
+
+ SPARK-1244: Throw exception if map output status exceeds frame size
+ Patrick Wendell <pwendell@gmail.com>, Andrew Or <andrewor14@gmail.com>
+ 2014-03-17 14:06:28 -0700
+ Commit: 4562140, github.com/apache/spark/pull/152
+
+ SPARK-1240: handle the case of empty RDD when takeSample
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-03-16 22:40:22 -0700
+ Commit: af7e8b1, github.com/apache/spark/pull/135
+
+ SPARK-977 Added Python RDD.zip function
+ Prabin Banka <prabin.banka@imaginea.com>
+ 2014-03-16 22:16:17 -0700
+ Commit: 1dc1e98, github.com/apache/spark/pull/76
+
+ Spark-1163, Added missing Python RDD functions
+ prabinb <prabin.banka@imaginea.com>
+ 2014-03-16 22:14:53 -0700
+ Commit: 249930a, github.com/apache/spark/pull/92
+
+ SPARK-1168, Added foldByKey to pyspark.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-16 22:13:33 -0700
+ Commit: 4480505, github.com/apache/spark/pull/115
+
+ Updated link for pyspark examples in docs
+ Jyotiska NK <jyotiska123@gmail.com>
+ 2014-03-16 22:12:51 -0700
+ Commit: e74e79a, github.com/apache/spark/pull/22
+
+ SPARK-1019: pyspark RDD take() throws an NPE
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-12 23:17:17 -0700
+ Commit: ef74e44, github.com/apache/spark/pull/112
+
+ Fix example bug: compile error
+ jianghan <jianghan@xiaomi.com>
+ 2014-03-12 19:46:48 -0700
+ Commit: 87e4dd5, github.com/apache/spark/pull/132
+
+ SPARK-1162 Added top in python.
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-12 15:57:54 -0700
+ Commit: 51a77e9, github.com/apache/spark/pull/93
+
+ Version fix in pom file
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-11 14:48:01 -0700
+ Commit: 7049164
+
+ Log4j build fix on 0.9 branch
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-11 11:53:29 -0700
+ Commit: 6cbd580
+
+ SPARK-1167: Remove metrics-ganglia from default build due to LGPL issues...
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-11 11:24:21 -0700
+ Commit: 0c91927, github.com/apache/spark/pull/108
+
+ For outputformats that are Configurable, call setConf before sending data to them.
+ Bryn Keller <bryn.keller@intel.com>
+ 2014-03-09 17:47:46 -0700
+ Commit: 6f0db0a, github.com/apache/spark/pull/638
+
+ SPARK-1190: Do not initialize log4j if slf4j log4j backend is not being used
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-08 16:02:56 -0800
+ Commit: 0f0d044, github.com/apache/spark/pull/107
+
+ SPARK-1184: Update the distribution tar.gz to include spark-assembly jar
+ Mark Grover <mark@apache.org>
+ 2014-03-05 16:55:36 -0800
+ Commit: 0fc0fdb, github.com/apache/spark/pull/78
+
+ SPARK-1109 wrong API docs for pyspark map function
+ Prashant Sharma <prashant.s@imaginea.com>
+ 2014-03-04 15:33:00 -0800
+ Commit: 7ea89ec, github.com/apache/spark/pull/73
+
+ Add Jekyll tag to isolate "production-only" doc components. (0.9 version)
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-03-02 18:18:44 -0800
+ Commit: 267d96c, github.com/apache/spark/pull/57
+
+ Removed reference to incubation in Spark user docs.
+ Reynold Xin <rxin@apache.org>
+ 2014-02-27 21:14:18 -0800
+ Commit: f2bf44a, github.com/apache/spark/pull/2
+
+ [SPARK-1089] fix the regression problem on ADD_JARS in 0.9
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-02-26 23:42:53 -0800
+ Commit: bc5e7d7, github.com/apache/spark/pull/13
+
+ Removed reference to incubation in README.md.
+ Reynold Xin <rxin@apache.org>
+ 2014-02-26 16:53:56 -0800
+ Commit: 349764d, github.com/apache/spark/pull/1
+
+ SPARK-1115: Catch depickling errors
+ Bouke van der Bijl <boukevanderbijl@gmail.com>
+ 2014-02-26 14:53:30 -0800
+ Commit: 886a466, github.com/apache/incubator-spark/pull/644
+
+ SPARK-1135: fix broken anchors in docs
+ Matei Zaharia <matei@databricks.com>
+ 2014-02-26 11:56:12 -0800
+ Commit: 6fe72dd, github.com/apache/spark/pull/3
+
+ Fix removal from shuffleToMapStage to search for a key-value pair with our stage instead of using our shuffleID.
+ Matei Zaharia <matei@databricks.com>
+ 2014-02-24 17:01:21 -0800
+ Commit: 0661cdc
+
+ SPARK-1124: Fix infinite retries of reduce stage when a map stage failed
+ Matei Zaharia <matei@databricks.com>
+ 2014-02-24 17:00:47 -0800
+ Commit: 5e74b8e
+
+ [SPARK-1055] fix the SCALA_VERSION and SPARK_VERSION in docker file
+ CodingCat <zhunansjtu@gmail.com>, Nan Zhu <CodingCat@users.noreply.github.com>
+ 2014-02-22 15:39:41 -0800
+ Commit: 00db30c, github.com/apache/incubator-spark/pull/634
+
+ SPARK-1117: update accumulator docs
+ Xiangrui Meng <meng@databricks.com>
+ 2014-02-21 22:44:59 -0800
+ Commit: ed58742, github.com/apache/incubator-spark/pull/631
+
+ [SPARK-1113] External spilling - fix Int.MaxValue hash code collision bug
+ Andrew Or <andrewor14@gmail.com>
+ 2014-02-21 20:06:09 -0800
+ Commit: 84131fe, github.com/apache/incubator-spark/pull/624
+
+ MLLIB-25: Implicit ALS runs out of memory for moderately large numbers of features
+ Sean Owen <sowen@cloudera.com>
+ 2014-02-21 13:39:17 -0800
+ Commit: 998abae, github.com/apache/incubator-spark/pull/629
+
+ SPARK-1111: URL Validation Throws Error for HDFS URL's
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-02-21 11:12:38 -0800
+ Commit: b3fff96, github.com/apache/incubator-spark/pull/625
+
+ Super minor: Add require for mergeCombiners in combineByKey
+ Aaron Davidson <aaron@databricks.com>
+ 2014-02-20 16:46:29 -0800
+ Commit: 3c44ff4, github.com/apache/incubator-spark/pull/623
+
+ [SPARK-1105] fix site scala version error in docs
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-02-19 15:56:24 -0800
+ Commit: 289d761, github.com/apache/incubator-spark/pull/618
+
+ Revert "[SPARK-1105] fix site scala version error in doc"
+ Patrick Wendell <pwendell@gmail.com>
+ 2014-02-18 17:47:34 -0800
+ Commit: 7bde72e
+
+ [SPARK-1105] fix site scala version error in doc
+ CodingCat <zhunansjtu@gmail.com>
+ 2014-02-18 16:33:41 -0800
+ Commit: 0f0395c, github.com/apache/incubator-spark/pull/616
+
+ Worker registration logging fix
+ Andrew Ash <andrew@andrewash.com>
+ 2014-02-17 09:52:16 -0800
+ Commit: b0b5288, github.com/apache/incubator-spark/pull/608
+
+ fix for https://spark-project.atlassian.net/browse/SPARK-1052
+ Bijay Bisht <bijay.bisht@gmail.com>
+ 2014-02-16 16:52:57 -0800
+ Commit: e797c1a, github.com/apache/incubator-spark/pull/568
+
+ Add c3 instance types to Spark EC2
+ Christian Lundgren <christian.lundgren@gameanalytics.com>
+ 2014-02-13 12:44:21 -0800
+ Commit: 19b4bb2, github.com/apache/incubator-spark/pull/595
+
+ SPARK-1088: Create a script for running tests so we can have version specific testing on Jenkins (branch-0.9)
+ Reynold Xin <rxin@apache.org>
+ 2014-02-12 23:42:58 -0800
+ Commit: e5b86b1, github.com/apache/incubator-spark/pull/593
+
+ Ported hadoopClient jar for < 1.0.1 fix
+ Bijay Bisht <bijay.bisht@gmail.com>
+ 2014-02-12 23:42:10 -0800
+ Commit: 8093de1, github.com/apache/incubator-spark/pull/584
+
+ 754bc18 2014-02-12 14:26:39 -0800
+ Merge pull request #590 from rxin/scalastyle.
+ [SPARK-1085: Fix Jenkins pull request builder for branch-0.9 (scalastyle command not found)]
+
+ 28f88c5 2014-02-11 22:43:09 -0800
+ Merge pull request #583 from colorant/zookeeper.
+ [Minor fix for ZooKeeperPersistenceEngine to use configured working dir]
+
+ e70690f 2014-02-09 23:33:35 -0800
+ Revert "Merge pull request #560 from pwendell/logging. Closes #560."
+ [This reverts commit 2e3d1c31db55c7f961e559e47bb497ae15cb74d7.]
+
+ de22abc 2014-02-08 23:37:05 -0800
+ Merge pull request #562 from jyotiska/master. Closes #562.
+ [Added example Python code for sort]
+
+ 2e3d1c3 2014-02-08 23:35:41 -0800
+ Merge pull request #560 from pwendell/logging. Closes #560.
+ [[WIP] SPARK-1067: Default log4j initialization causes errors for those not using log4j]
+
+ 22e0a3b 2014-02-08 13:00:07 -0800
+ Merge pull request #561 from Qiuzhuang/master. Closes #561.
+ [Kill drivers in postStop() for Worker.]
+
+ ce179f6 2014-02-06 22:06:30 -0800
+ Merge pull request #533 from andrewor14/master. Closes #533.
+ [External spilling - generalize batching logic]
+
+ 24e5298 2014-02-06 16:15:36 -0800
+ Merge pull request #450 from kayousterhout/fetch_failures. Closes #450.
+ [Only run ResubmitFailedStages event after a fetch fails]
+
+ 94896bb 2014-02-06 16:13:10 -0800
+ Merge pull request #321 from kayousterhout/ui_kill_fix. Closes #321.
+ [Inform DAG scheduler about all started/finished tasks.]
+
+ 44a2b03 2014-02-05 23:38:25 -0800
+ Merge pull request #545 from kayousterhout/fix_progress. Closes #545.
+ [Fix off-by-one error with task progress info log.]
+
+ b044b0b 2014-02-05 23:37:38 -0800
+ Merge pull request #526 from tgravescs/yarn_client_stop_am_fix. Closes #526.
+ [spark on yarn - yarn-client mode doesn't always exit immediately]
+
+ d815cfa 2014-02-04 09:47:25 -0800
+ Merge pull request #534 from sslavic/patch-1. Closes #534.
+ [Fixed wrong path to compute-classpath.cmd]
+
+ f3cba2d 2014-02-04 09:46:00 -0800
+ Merge pull request #535 from sslavic/patch-2. Closes #535.
+ [Fixed typo in scaladoc]
+
+ 5f63f32 2014-02-03 22:44:30 -0800
+ Merge pull request #449 from CrazyJvm/master
+ [SPARK-1028 : fix "set MASTER automatically fails" bug.]
+
+ 6e4d089 2014-02-03 22:42:43 -0800
+ Merge pull request #414 from soulmachine/code-style
+ [Code clean up for mllib]
+
+ 0021ef9 2014-02-03 22:42:01 -0800
+ Merge pull request #445 from kayousterhout/exec_lost
+ [Fail rather than hanging if a task crashes the JVM.]
+
+ dc8adf1 2014-02-03 22:41:30 -0800
+ Merge pull request #489 from ash211/patch-6
+ [Clarify spark.default.parallelism]
+
+ 574741f 2014-02-03 22:40:55 -0800
+ Merge pull request #493 from kayousterhout/double_add
+ [Fixed bug where task set managers are added to queue twice]
+
+ 1280e8a 2014-02-03 22:40:29 -0800
+ Merge pull request #511 from JoshRosen/SPARK-1040
+ [Fix ClassCastException in JavaPairRDD.collectAsMap() (SPARK-1040)]
+
+ 2c6c9b9 2014-02-03 22:39:59 -0800
+ Merge pull request #504 from JoshRosen/SPARK-1025
+ [Fix PySpark hang when input files are deleted (SPARK-1025)]
+
+ b10f607 2014-02-03 22:39:10 -0800
+ Merge pull request #516 from sarutak/master
+ [modified SparkPluginBuild.scala to use https protocol for accessing gith...]
+
+ 18520f5 2014-02-03 22:37:38 -0800
+ Merge pull request #490 from hsaputra/modify_checkoption_with_isdefined
+ [Replace the check for None Option with isDefined and isEmpty in Scala code]
+
+ a414071 2014-01-31 16:54:33 -0800
+ Merge pull request #524 from rxin/doc
+ [Added spark.shuffle.file.buffer.kb to configuration doc.]
+
+ a41a83c 2014-01-31 16:53:26 -0800
+ Merge pull request #527 from ankurdave/graphx-assembly-pom
+ [Add GraphX to assembly/pom.xml]
+
+ d18fe1f 2014-01-28 21:55:15 -0800
+ Merge pull request #497 from tdas/docs-update
+ [Updated Spark Streaming Programming Guide]
+
+ 5edbd17 2014-01-28 21:32:58 -0800
+ Merge pull request #523 from JoshRosen/SPARK-1043
+ [Switch from MUTF8 to UTF8 in PySpark serializers.]
+
+ [maven-release-plugin] prepare for next development iteration
+ Ubuntu <ubuntu@ip-10-109-132-81.ec2.internal>
+ 2014-01-24 06:15:15 +0000
+ Commit: 0f60ef2
+
+Release 0.9.0-incubating
+
+ d0a105d Thu Jan 23 20:53:31 2014 -0800
+ Merge pull request #505 from JoshRosen/SPARK-1026
+ [Deprecate mapPartitionsWithSplit in PySpark (SPARK-1026)]
+
+ e66d4c2 Thu Jan 23 19:47:16 2014 -0800
+ Merge pull request #503 from pwendell/master
+ [Fix bug on read-side of external sort when using Snappy.]
+
+ e8d3f2b Thu Jan 23 19:20:22 2014 -0800
+ Merge pull request #502 from pwendell/clone-1
+ [Remove Hadoop object cloning and warn users making Hadoop RDD's.]
+
+ 7a62353 Thu Jan 23 19:09:25 2014 -0800
+ Merge pull request #501 from JoshRosen/cartesian-rdd-fixes
+ [Fix two bugs in PySpark cartesian(): SPARK-978 and SPARK-1034]
+
+ 51960b8 Wed Jan 22 19:37:50 2014 -0800
+ Merge pull request #496 from pwendell/master
+ [Fix bug in worker clean-up in UI]
+
+ 828f7b4 Wed Jan 22 15:45:18 2014 -0800
+ Merge pull request #495 from srowen/GraphXCommonsMathDependency
+ [Fix graphx Commons Math dependency]
+
+ dc5857a Wed Jan 22 14:33:25 2014 -0800
+ Merge pull request #492 from skicavs/master
+ [fixed job name and usage information for the JavaSparkPi example]
+
+ dd533c9 Wed Jan 22 14:15:58 2014 -0800
+ Merge pull request #478 from sryza/sandy-spark-1033
+ [SPARK-1033. Ask for cores in Yarn container requests]
+
+ b6fd3cd Tue Jan 21 00:12:01 2014 -0800
+ Merge pull request #480 from pwendell/0.9-fixes
+ [Handful of 0.9 fixes]
+
+ e5f8917 Mon Jan 20 23:35:07 2014 -0800
+ Merge pull request #484 from tdas/run-example-fix
+ [Made run-example respect SPARK_JAVA_OPTS and SPARK_MEM.]
+
+ 410ba06 Mon Jan 20 22:26:14 2014 -0800
+ Merge pull request #482 from tdas/streaming-example-fix
+ [Added StreamingContext.awaitTermination to streaming examples]
+
+ f137947 Mon Jan 20 22:24:07 2014 -0800
+ Merge pull request #483 from pwendell/gitignore
+ [Restricting /lib to top level directory in .gitignore]
+
+ 94ae25d Sun Jan 19 11:33:51 2014 -0800
+ Merge pull request #470 from tgravescs/fix_spark_examples_yarn
+ [Only log error on missing jar to allow spark examples to jar.]
+
+ 0f077b5 Sun Jan 19 10:30:29 2014 -0800
+ Merge pull request #458 from tdas/docs-update
+ [Updated java API docs for streaming, along with very minor changes in the code examples.]
+
+ 03019d1 Sat Jan 18 16:29:43 2014 -0800
+ Merge pull request #459 from srowen/UpdaterL2Regularization
+ [Correct L2 regularized weight update with canonical form]
+
+ 76147a2 Sat Jan 18 16:24:16 2014 -0800
+ Merge pull request #437 from mridulm/master
+ [Minor api usability changes]
+
+ 4ac8cab Sat Jan 18 16:22:46 2014 -0800
+ Merge pull request #426 from mateiz/py-ml-tests
+ [Re-enable Python MLlib tests (require Python 2.7 and NumPy 1.7+)]
+
+ 34e911c Sat Jan 18 16:17:34 2014 -0800
+ Merge pull request #462 from mateiz/conf-file-fix
+ [Remove Typesafe Config usage and conf files to fix nested property names]
+
+ ff7201c Sat Jan 18 12:50:02 2014 -0800
+ Merge pull request #461 from pwendell/master
+ [Use renamed shuffle spill config in CoGroupedRDD.scala]
+
+ 7b0d5a5 Thu Jan 16 23:18:48 2014 -0800
+ Merge pull request #451 from Qiuzhuang/master
+ [Fixed Window spark shell launch script error.]
+
+ 4ccedb3 Wed Jan 15 14:26:48 2014 -0800
+ Merge pull request #444 from mateiz/py-version
+ [Clarify that Python 2.7 is only needed for MLlib]
+
+ e3fa36f Wed Jan 15 13:56:04 2014 -0800
+ Merge pull request #442 from pwendell/standalone
+ [Workers should use working directory as spark home if it's not specified]
+
+ 29c76d9 Wed Jan 15 13:55:48 2014 -0800
+ Merge pull request #443 from tdas/filestream-fix
+ [Made some classes private[streaming] and deprecated a method in JavaStreamingContext.]
+
+ aca40aa Wed Jan 15 11:15:47 2014 -0800
+ Merge pull request #441 from pwendell/graphx-build
+ [GraphX shouldn't list Spark as provided.]
+
+ e12c374 Wed Jan 15 10:01:43 2014 -0800
+ Merge pull request #433 from markhamstra/debFix
+ [Updated Debian packaging]
+
+ 2f015c2 Tue Jan 14 23:17:28 2014 -0800
+ Merge pull request #436 from ankurdave/VertexId-case
+ [Rename VertexID -> VertexId in GraphX]
+
+ 2859cab Tue Jan 14 23:08:19 2014 -0800
+ Merge pull request #435 from tdas/filestream-fix
+ [Fixed the flaky tests by making SparkConf not serializable]
+
+ fbfbb33 Tue Jan 14 23:06:29 2014 -0800
+ Merge pull request #434 from rxin/graphxmaven
+ [Fixed SVDPlusPlusSuite in Maven build.]
+
+ 2c6c07f Tue Jan 14 21:53:05 2014 -0800
+ Merge pull request #424 from jegonzal/GraphXProgrammingGuide
+ [Additional edits for clarity in the graphx programming guide.]
+
+ 6fa4e02 Tue Jan 14 21:51:25 2014 -0800
+ Merge pull request #431 from ankurdave/graphx-caching-doc
+ [Describe caching and uncaching in GraphX programming guide]
+
+ 2f930d5 Tue Jan 14 15:00:11 2014 -0800
+ Merge pull request #428 from pwendell/writeable-objects
+ [Don't clone records for text files]
+
+ 329c9df Tue Jan 14 14:53:36 2014 -0800
+ Merge pull request #429 from ankurdave/graphx-examples-pom.xml
+ [Add GraphX dependency to examples/pom.xml]
+
+ a14933d Tue Jan 14 14:52:42 2014 -0800
+ Merge pull request #427 from pwendell/deprecate-aggregator
+ [Deprecate rather than remove old combineValuesByKey function]
+
+ 119b6c5 Tue Jan 14 13:29:08 2014 -0800
+ Merge pull request #425 from rxin/scaladoc
+ [API doc update & make Broadcast public]
+
+ bf3b150 Tue Jan 14 09:45:22 2014 -0800
+ Merge pull request #423 from jegonzal/GraphXProgrammingGuide
+ [Improving the graphx-programming-guide]
+
+ 1b4adc2 Tue Jan 14 01:19:24 2014 -0800
+ Merge pull request #420 from pwendell/header-files
+ [Add missing header files]
+
+ b60840e Tue Jan 14 00:48:34 2014 -0800
+ Merge pull request #418 from pwendell/0.9-versions
+ [Version changes for release 0.9.0.]
+
+ 980250b Tue Jan 14 00:05:37 2014 -0800
+ Merge pull request #416 from tdas/filestream-fix
+ [Removed unnecessary DStream operations and updated docs]
+
+ 055be5c Mon Jan 13 23:26:44 2014 -0800
+ Merge pull request #415 from pwendell/shuffle-compress
+ [Enable compression by default for spills]
+
+ fdaabdc Mon Jan 13 23:08:26 2014 -0800
+ Merge pull request #380 from mateiz/py-bayes
+ [Add Naive Bayes to Python MLlib, and some API fixes]
+
+ 4a805af Mon Jan 13 22:58:38 2014 -0800
+ Merge pull request #367 from ankurdave/graphx
+ [GraphX: Unifying Graphs and Tables]
+
+ 945fe7a Mon Jan 13 22:56:12 2014 -0800
+ Merge pull request #408 from pwendell/external-serializers
+ [Improvements to external sorting]
+
+ 68641bc Mon Jan 13 22:54:13 2014 -0800
+ Merge pull request #413 from rxin/scaladoc
+ [Adjusted visibility of various components and documentation for 0.9.0 release.]
+
+ 0ca0d4d Mon Jan 13 22:32:21 2014 -0800
+ Merge pull request #401 from andrewor14/master
+ [External sorting - Add number of bytes spilled to Web UI]
+
+ 08b9fec Mon Jan 13 22:29:03 2014 -0800
+ Merge pull request #409 from tdas/unpersist
+ [Automatically unpersisting RDDs that have been cleaned up from DStreams]
+
+ b07bc02 Mon Jan 13 20:45:22 2014 -0800
+ Merge pull request #412 from harveyfeng/master
+ [Add default value for HadoopRDD's `cloneRecords` constructor arg]
+
+ a2fee38 Mon Jan 13 19:45:26 2014 -0800
+ Merge pull request #411 from tdas/filestream-fix
+ [Improved logic of finding new files in FileInputDStream]
+
+ 01c0d72 Mon Jan 13 16:24:30 2014 -0800
+ Merge pull request #410 from rxin/scaladoc1
+ [Updated JavaStreamingContext to make scaladoc compile.]
+
+ 8038da2 Mon Jan 13 14:59:30 2014 -0800
+ Merge pull request #2 from jegonzal/GraphXCCIssue
+ [Improving documentation and identifying potential bug in CC calculation.]
+
+ b93f9d4 Mon Jan 13 12:18:05 2014 -0800
+ Merge pull request #400 from tdas/dstream-move
+ [Moved DStream and PairDStream to org.apache.spark.streaming.dstream]
+
+ e6ed13f Sun Jan 12 22:35:14 2014 -0800
+ Merge pull request #397 from pwendell/host-port
+ [Remove now un-needed hostPort option]
+
+ 0b96d85 Sun Jan 12 21:31:43 2014 -0800
+ Merge pull request #399 from pwendell/consolidate-off
+ [Disable shuffle file consolidation by default]
+
+ 0ab505a Sun Jan 12 21:31:04 2014 -0800
+ Merge pull request #395 from hsaputra/remove_simpleredundantreturn_scala
+ [Remove simple redundant return statements for Scala methods/functions]
+
+ 405bfe8 Sun Jan 12 20:04:21 2014 -0800
+ Merge pull request #394 from tdas/error-handling
+ [Better error handling in Spark Streaming and more API cleanup]
+
+ 28a6b0c Sun Jan 12 19:49:36 2014 -0800
+ Merge pull request #398 from pwendell/streaming-api
+ [Rename DStream.foreach to DStream.foreachRDD]
+
+ 074f502 Sun Jan 12 17:01:13 2014 -0800
+ Merge pull request #396 from pwendell/executor-env
+ [Setting load defaults to true in executor]
+
+ 82e2b92 Sun Jan 12 16:55:11 2014 -0800
+ Merge pull request #392 from rxin/listenerbus
+ [Stop SparkListenerBus daemon thread when DAGScheduler is stopped.]
+
+ 288a878 Sat Jan 11 21:53:19 2014 -0800
+ Merge pull request #389 from rxin/clone-writables
+ [Minor update for clone writables and more documentation.]
+
+ dbc11df Sat Jan 11 18:07:13 2014 -0800
+ Merge pull request #388 from pwendell/master
+ [Fix UI bug introduced in #244.]
+
+ 409866b Sat Jan 11 17:12:06 2014 -0800
+ Merge pull request #393 from pwendell/revert-381
+ [Revert PR 381]
+
+ 6510f04 Sat Jan 11 12:48:26 2014 -0800
+ Merge pull request #387 from jerryshao/conf-fix
+ [Fix configure didn't work small problem in ALS]
+
+ ee6e7f9 Sat Jan 11 12:07:55 2014 -0800
+ Merge pull request #359 from ScrapCodes/clone-writables
+ [We clone hadoop key and values by default and reuse objects if asked to.]
+
+ 4216178 Sat Jan 11 09:46:48 2014 -0800
+ Merge pull request #373 from jerryshao/kafka-upgrade
+ [Upgrade Kafka dependency to 0.8.0 release version]
+
+ 92ad18b Fri Jan 10 23:25:15 2014 -0800
+ Merge pull request #376 from prabeesh/master
+ [Change clientId to random clientId]
+
+ 0b5ce7a Fri Jan 10 23:23:21 2014 -0800
+ Merge pull request #386 from pwendell/typo-fix
+ [Small typo fix]
+
+ 1d7bef0 Fri Jan 10 18:53:03 2014 -0800
+ Merge pull request #381 from mateiz/default-ttl
+ [Fix default TTL for metadata cleaner]
+
+ 44d6a8e Fri Jan 10 17:51:50 2014 -0800
+ Merge pull request #382 from RongGu/master
+ [Fix a type error in comment lines]
+
+ 88faa30 Fri Jan 10 17:14:22 2014 -0800
+ Merge pull request #385 from shivaram/add-i2-instances
+ [Add i2 instance types to Spark EC2.]
+
+ f265531 Fri Jan 10 16:25:44 2014 -0800
+ Merge pull request #383 from tdas/driver-test
+ [API for automatic driver recovery for streaming programs and other bug fixes]
+
+ d37408f Fri Jan 10 16:25:01 2014 -0800
+ Merge pull request #377 from andrewor14/master
+ [External Sorting for Aggregator and CoGroupedRDDs (Revisited)]
+
+ 0eaf01c Fri Jan 10 15:32:19 2014 -0800
+ Merge pull request #369 from pillis/master
+ [SPARK-961 Add a Vector.random() method]
+
+ 7cef843 Fri Jan 10 15:34:15 2014 -0600
+ Merge pull request #371 from tgravescs/yarn_client_addjar_misc_fixes
+ [Yarn client addjar and misc fixes]
+
+ 7b58f11 Fri Jan 10 12:47:46 2014 -0800
+ Merge pull request #384 from pwendell/debug-logs
+ [Make DEBUG-level logs consumable.]
+
+ 23d2995 Fri Jan 10 10:20:02 2014 -0800
+ Merge pull request #1 from jegonzal/graphx
+ [ProgrammingGuide]
+
+ 0ebc973 Thu Jan 9 23:58:49 2014 -0800
+ Merge pull request #375 from mateiz/option-fix
+ [Fix bug added when we changed AppDescription.maxCores to an Option]
+
+ dd03cea Thu Jan 9 23:38:03 2014 -0800
+ Merge pull request #378 from pwendell/consolidate_on
+ [Enable shuffle consolidation by default.]
+
+ 997c830 Thu Jan 9 22:22:20 2014 -0800
+ Merge pull request #363 from pwendell/streaming-logs
+ [Set default logging to WARN for Spark streaming examples.]
+
+ 300eaa9 Thu Jan 9 20:29:51 2014 -0800
+ Merge pull request #353 from pwendell/ipython-simplify
+ [Simplify and fix pyspark script.]
+
+ 4b074fa Thu Jan 9 19:03:55 2014 -0800
+ Merge pull request #374 from mateiz/completeness
+ [Add some missing Java API methods]
+
+ a9d5333 Thu Jan 9 18:46:46 2014 -0800
+ Merge pull request #294 from RongGu/master
+ [Bug fixes for updating the RDD block's memory and disk usage information]
+
+ d86a85e Thu Jan 9 18:37:52 2014 -0800
+ Merge pull request #293 from pwendell/standalone-driver
+ [SPARK-998: Support Launching Driver Inside of Standalone Mode]
+
+ 26cdb5f Thu Jan 9 17:16:34 2014 -0800
+ Merge pull request #372 from pwendell/log4j-fix-1
+ [Send logs to stderr by default (instead of stdout).]
+
+ 12f414e Thu Jan 9 15:31:30 2014 -0800
+ Merge pull request #362 from mateiz/conf-getters
+ [Use typed getters for configuration settings]
+
+ 365cac9 Thu Jan 9 00:56:16 2014 -0800
+ Merge pull request #361 from rxin/clean
+ [Minor style cleanup. Mostly on indenting & line width changes.]
+
+ 73c724e Thu Jan 9 00:32:19 2014 -0800
+ Merge pull request #368 from pwendell/sbt-fix
+ [Don't delegate to users `sbt`.]
+
+ dceedb4 Wed Jan 8 23:19:28 2014 -0800
+ Merge pull request #364 from pwendell/fix
+ [Fixing config option "retained_stages" => "retainedStages".]
+
+ 04d83fc Wed Jan 8 11:55:37 2014 -0800
+ Merge pull request #360 from witgo/master
+ [fix make-distribution.sh show version: command not found]
+
+ 56ebfea Wed Jan 8 11:50:06 2014 -0800
+ Merge pull request #357 from hsaputra/set_boolean_paramname
+ [Set boolean param name for call to SparkHadoopMapReduceUtil.newTaskAttemptID]
+
+ bdeaeaf Wed Jan 8 11:48:39 2014 -0800
+ Merge pull request #358 from pwendell/add-cdh
+ [Add CDH Repository to Maven Build]
+
+ 5cae05f Wed Jan 8 11:47:28 2014 -0800
+ Merge pull request #356 from hsaputra/remove_deprecated_cleanup_method
+ [Remove calls to deprecated mapred's OutputCommitter.cleanupJob]
+
+ 6eef78d Wed Jan 8 08:49:20 2014 -0600
+ Merge pull request #345 from colorant/yarn
+ [support distributing extra files to worker for yarn client mode]
+
+ bb6a39a Tue Jan 7 22:32:18 2014 -0800
+ Merge pull request #322 from falaki/MLLibDocumentationImprovement
+ [SPARK-1009 Updated MLlib docs to show how to use it in Python]
+
+ cb1b927 Tue Jan 7 22:26:28 2014 -0800
+ Merge pull request #355 from ScrapCodes/patch-1
+ [Update README.md]
+
+ c0f0155 Tue Jan 7 22:21:52 2014 -0800
+ Merge pull request #313 from tdas/project-refactor
+ [Refactored the streaming project to separate external libraries like Twitter, Kafka, Flume, etc.]
+
+ f5f12dc Tue Jan 7 21:56:35 2014 -0800
+ Merge pull request #336 from liancheng/akka-remote-lookup
+ [Get rid of `Either[ActorRef, ActorSelection]']
+
+ 11891e6 Wed Jan 8 00:32:18 2014 -0500
+ Merge pull request #327 from lucarosellini/master
+ [Added ‘-i’ command line option to Spark REPL]
+
+ 7d0aac9 Wed Jan 8 00:30:45 2014 -0500
+ Merge pull request #354 from hsaputra/addasfheadertosbt
+ [Add ASF header to the new sbt script.]
+
+ d75dc42 Wed Jan 8 00:30:03 2014 -0500
+ Merge pull request #350 from mateiz/standalone-limit
+ [Add way to limit default # of cores used by apps in standalone mode]
+
+ 61674bc Tue Jan 7 18:32:13 2014 -0800
+ Merge pull request #352 from markhamstra/oldArch
+ [Don't leave os.arch unset after BlockManagerSuite]
+
+ b2e690f Tue Jan 7 16:57:08 2014 -0800
+ Merge pull request #328 from falaki/MatrixFactorizationModel-fix
+ [SPARK-1012: DAGScheduler Exception Fix]
+
+ 6ccf8ce Tue Jan 7 15:49:14 2014 -0800
+ Merge pull request #351 from pwendell/maven-fix
+ [Add log4j exclusion rule to maven.]
+
+ 7d5fa17 Tue Jan 7 11:31:34 2014 -0800
+ Merge pull request #337 from yinxusen/mllib-16-bugfix
+ [Mllib 16 bugfix]
+
+ 71fc113 Tue Jan 7 11:30:35 2014 -0800
+ Merge pull request #349 from CodingCat/support-worker_dir
+ [add the comments about SPARK_WORKER_DIR]
+
+ 15d9534 Tue Jan 7 08:10:02 2014 -0800
+ Merge pull request #318 from srowen/master
+ [Suggested small changes to Java code for slightly more standard style, encapsulation and in some cases performance]
+
+ 468af0f Tue Jan 7 08:09:01 2014 -0800
+ Merge pull request #348 from prabeesh/master
+ [spark -> org.apache.spark]
+
+ c3cf047 Tue Jan 7 00:54:25 2014 -0800
+ Merge pull request #339 from ScrapCodes/conf-improvements
+ [Conf improvements]
+
+ a862caf Tue Jan 7 00:18:20 2014 -0800
+ Merge pull request #331 from holdenk/master
+ [Add a script to download sbt if not present on the system]
+
+ b97ef21 Mon Jan 6 20:12:57 2014 -0800
+ Merge pull request #346 from sproblvem/patch-1
+ [Update stop-slaves.sh]
+
+ 7210257 Mon Jan 6 18:25:44 2014 -0800
+ Merge pull request #128 from adamnovak/master
+ [Fix failing "sbt/sbt publish-local" by adding a no-argument PrimitiveKeyOpenHashMap constructor ]
+
+ e4d6057 Mon Jan 6 14:56:54 2014 -0800
+ Merge pull request #343 from pwendell/build-fix
+ [Fix test breaking downstream builds]
+
+ 93bf962 Mon Jan 6 11:42:41 2014 -0800
+ Merge pull request #340 from ScrapCodes/sbt-fixes
+ [Made java options to be applied during tests so that they become self explanatory.]
+
+ 60edeb3 Mon Jan 6 11:40:32 2014 -0800
+ Merge pull request #338 from ScrapCodes/ning-upgrade
+ [SPARK-1005 Ning upgrade]
+
+ c708e81 Mon Jan 6 11:35:48 2014 -0800
+ Merge pull request #341 from ash211/patch-5
+ [Clarify spark.cores.max in docs]
+
+ 33fcb91 Mon Jan 6 11:19:23 2014 -0800
+ Merge pull request #342 from tgravescs/fix_maven_protobuf
+ [Change protobuf version for yarn alpha back to 2.4.1]
+
+ 357083c Mon Jan 6 10:29:04 2014 -0800
+ Merge pull request #330 from tgravescs/fix_addjars_null_handling
+ [Fix handling of empty SPARK_EXAMPLES_JAR]
+
+ a2e7e04 Sun Jan 5 22:37:36 2014 -0800
+ Merge pull request #333 from pwendell/logging-silence
+ [Quiet ERROR-level Akka Logs]
+
+ 5b0986a Sun Jan 5 19:25:09 2014 -0800
+ Merge pull request #334 from pwendell/examples-fix
+ [Removing SPARK_EXAMPLES_JAR in the code]
+
+ f4b924f Sun Jan 5 17:11:47 2014 -0800
+ Merge pull request #335 from rxin/ser
+ [Fall back to zero-arg constructor for Serializer initialization if there is no constructor that accepts SparkConf.]
+
+ d43ad3e Sat Jan 4 16:29:30 2014 -0800
+ Merge pull request #292 from soulmachine/naive-bayes
+ [standard Naive Bayes classifier]
+
+ 86404da Sat Jan 4 14:55:54 2014 -0800
+ Merge pull request #127 from jegonzal/MapByPartition
+ [Adding mapEdges and mapTriplets by Partition]
+
+ e68cdb1 Sat Jan 4 13:46:02 2014 -0800
+ Merge pull request #124 from jianpingjwang/master
+ [refactor and bug fix]
+
+ 280ddf6 Sat Jan 4 12:54:41 2014 -0800
+ Merge pull request #121 from ankurdave/more-simplify
+ [Simplify GraphImpl internals further]
+
+ 10fe23b Fri Jan 3 23:50:14 2014 -0800
+ Merge pull request #329 from pwendell/remove-binaries
+ [SPARK-1002: Remove Binaries from Spark Source]
+
+ c4d6145 Fri Jan 3 16:30:53 2014 -0800
+ Merge pull request #325 from witgo/master
+ [Modify spark on yarn to create SparkConf process]
+
+ 4ae101f Fri Jan 3 11:24:35 2014 -0800
+ Merge pull request #317 from ScrapCodes/spark-915-segregate-scripts
+ [Spark-915 segregate scripts]
+
+ 87248bd Fri Jan 3 00:45:31 2014 -0800
+ Merge pull request #1 from apache/master
+ [Merge latest Spark changes]
+
+ 30b9db0 Thu Jan 2 23:15:55 2014 -0800
+ Merge pull request #285 from colorant/yarn-refactor
+ [Yarn refactor]
+
+ 498a5f0 Thu Jan 2 19:06:40 2014 -0800
+ Merge pull request #323 from tgravescs/sparkconf_yarn_fix
+ [fix spark on yarn after the sparkConf changes]
+
+ 0475ca8 Thu Jan 2 15:17:08 2014 -0800
+ Merge pull request #320 from kayousterhout/erroneous_failed_msg
+ [Remove erroneous FAILED state for killed tasks.]
+
+ 588a169 Thu Jan 2 13:20:54 2014 -0800
+ Merge pull request #297 from tdas/window-improvement
+ [Improvements to DStream window ops and refactoring of Spark's CheckpointSuite]
+
+ 5e67cdc Thu Jan 2 12:56:28 2014 -0800
+ Merge pull request #319 from kayousterhout/remove_error_method
+ [Removed redundant TaskSetManager.error() function.]
+
+ ca67909 Thu Jan 2 15:54:54 2014 -0500
+ Merge pull request #311 from tmyklebu/master
+ [SPARK-991: Report information gleaned from a Python stacktrace in the UI]
+
+ 3713f81 Wed Jan 1 21:29:12 2014 -0800
+ Merge pull request #309 from mateiz/conf2
+ [SPARK-544. Migrate configuration to a SparkConf class]
+
+ c1d928a Wed Jan 1 17:03:48 2014 -0800
+ Merge pull request #312 from pwendell/log4j-fix-2
+ [SPARK-1008: Logging improvements]
+
+ dc9cb83 Wed Jan 1 13:28:34 2014 -0800
+ Merge pull request #126 from jegonzal/FixingPersist
+ [Fixing Persist Behavior]
+
+ 9a0ff72 Tue Dec 31 21:50:24 2013 -0800
+ Merge pull request #314 from witgo/master
+ [restore core/pom.xml file modification]
+
+ 8b8e70e Tue Dec 31 17:48:24 2013 -0800
+ Merge pull request #73 from falaki/ApproximateDistinctCount
+ [Approximate distinct count]
+
+ 63b411d Tue Dec 31 14:31:28 2013 -0800
+ Merge pull request #238 from ngbinh/upgradeNetty
+ [upgrade Netty from 4.0.0.Beta2 to 4.0.13.Final]
+
+ 32d6ae9 Tue Dec 31 13:51:07 2013 -0800
+ Merge pull request #120 from ankurdave/subgraph-reuses-view
+ [Reuse VTableReplicated in GraphImpl.subgraph]
+
+ 55b7e2f Tue Dec 31 10:12:51 2013 -0800
+ Merge pull request #289 from tdas/filestream-fix
+ [Bug fixes for file input stream and checkpointing]
+
+ 2b71ab9 Mon Dec 30 11:01:30 2013 -0800
+ Merge pull request from aarondav: Utilize DiskBlockManager pathway for temp file writing
+ [This gives us a couple advantages:]
+
+ 50e3b8e Mon Dec 30 07:44:26 2013 -0800
+ Merge pull request #308 from kayousterhout/stage_naming
+ [Changed naming of StageCompleted event to be consistent]
+
+ 72a17b6 Sat Dec 28 21:25:40 2013 -1000
+ Revert "Merge pull request #310 from jyunfan/master"
+ [This reverts commit 79b20e4dbe3dcd8559ec8316784d3334bb55868b, reversing]
+
+ 79b20e4 Sat Dec 28 21:13:36 2013 -1000
+ Merge pull request #310 from jyunfan/master
+ [Fix typo in the Accumulators section]
+
+ 7375047 Sat Dec 28 13:25:06 2013 -0800
+ Merge pull request #304 from kayousterhout/remove_unused
+ [Removed unused failed and causeOfFailure variables (in TaskSetManager)]
+
+ ad3dfd1 Fri Dec 27 22:10:14 2013 -0500
+ Merge pull request #307 from kayousterhout/other_failure
+ [Removed unused OtherFailure TaskEndReason.]
+
+ b579b83 Fri Dec 27 22:09:04 2013 -0500
+ Merge pull request #306 from kayousterhout/remove_pending
+ [Remove unused hasPendingTasks methods]
+
+ 19672dc Fri Dec 27 13:37:10 2013 -0800
+ Merge pull request #305 from kayousterhout/line_spacing
+ [Fixed >100char lines in DAGScheduler.scala]
+
+ 7be1e57 Thu Dec 26 23:41:40 2013 -1000
+ Merge pull request #298 from aarondav/minor
+ [Minor: Decrease margin of left side of Log page]
+
+ 7d811ba Thu Dec 26 23:39:58 2013 -1000
+ Merge pull request #302 from pwendell/SPARK-1007
+ [SPARK-1007: spark-class2.cmd should change SCALA_VERSION to be 2.10]
+
+ 5e69fc5 Thu Dec 26 19:10:39 2013 -0500
+ Merge pull request #295 from markhamstra/JobProgressListenerNPE
+ [Avoid a lump of coal (NPE) in JobProgressListener's stocking.]
+
+ da20270 Thu Dec 26 12:11:52 2013 -0800
+ Merge pull request #1 from aarondav/driver
+ [Refactor DriverClient to be more Actor-based]
+
+ e240bad Thu Dec 26 12:30:48 2013 -0500
+ Merge pull request #296 from witgo/master
+ [Renamed ClusterScheduler to TaskSchedulerImpl for yarn and new-yarn package]
+
+ c344ed0 Thu Dec 26 01:31:06 2013 -0500
+ Merge pull request #283 from tmyklebu/master
+ [Python bindings for mllib]
+
+ 56094bc Wed Dec 25 13:14:33 2013 -0500
+ Merge pull request #290 from ash211/patch-3
+ [Typo: avaiable -> available]
+
+ 4842a07 Wed Dec 25 01:52:15 2013 -0800
+ Merge pull request #287 from azuryyu/master
+ [Fixed job name in the java streaming example.]
+
+ 85a344b Tue Dec 24 16:35:06 2013 -0800
+ Merge pull request #127 from kayousterhout/consolidate_schedulers
+ [Deduplicate Local and Cluster schedulers.]
+
+ c2dd6bc Tue Dec 24 14:36:47 2013 -0800
+ Merge pull request #279 from aarondav/shuffle-cleanup0
+ [Clean up shuffle files once their metadata is gone]
+
+ 3bf7c70 Tue Dec 24 16:37:13 2013 -0500
+ Merge pull request #275 from ueshin/wip/changeclasspathorder
+ [Change the order of CLASSPATH.]
+
+ d63856c Mon Dec 23 22:07:26 2013 -0800
+ Merge pull request #286 from rxin/build
+ [Show full stack trace and time taken in unit tests.]
+
+ 23a9ae6 Tue Dec 24 00:08:48 2013 -0500
+ Merge pull request #277 from tdas/scheduler-update
+ [Refactored the streaming scheduler and added StreamingListener interface]
+
+ 11107c9 Mon Dec 23 10:38:20 2013 -0800
+ Merge pull request #244 from leftnoteasy/master
+ [Added SPARK-968 implementation for review]
+
+ 44e4205 Sun Dec 22 11:44:18 2013 -0800
+ Merge pull request #116 from jianpingjwang/master
+ [remove unused variables and fix a bug]
+
+ 4797c22 Fri Dec 20 13:30:39 2013 -0800
+ Merge pull request #118 from ankurdave/VertexPartitionSuite
+ [Test VertexPartition and fix bugs]
+
+ 0bc57c5 Fri Dec 20 11:56:54 2013 -0800
+ Merge pull request #280 from aarondav/minor
+ [Minor cleanup for standalone scheduler]
+
+ ac70b8f Fri Dec 20 10:56:10 2013 -0800
+ Merge pull request #117 from ankurdave/more-tests
+ [More tests]
+
+ 45310d4 Thu Dec 19 22:08:20 2013 -0800
+ Merge pull request #115 from ankurdave/test-reorg
+ [Reorganize unit tests; improve GraphSuite test coverage]
+
+ 9228ec8 Thu Dec 19 21:37:15 2013 -0800
+ Merge pull request #1 from aarondav/127
+ [Merge master into 127]
+
+ eca68d4 Thu Dec 19 18:12:22 2013 -0800
+ Merge pull request #272 from tmyklebu/master
+ [Track and report task result serialisation time.]
+
+ 7990c56 Thu Dec 19 13:35:09 2013 -0800
+ Merge pull request #276 from shivaram/collectPartition
+ [Add collectPartition to JavaRDD interface.]
+
+ 440e531 Thu Dec 19 10:38:56 2013 -0800
+ Merge pull request #278 from MLnick/java-python-tostring
+ [Add toString to Java RDD, and __repr__ to Python RDD]
+
+ d8d3f3e Thu Dec 19 00:06:43 2013 -0800
+ Merge pull request #183 from aarondav/spark-959
+ [[SPARK-959] Explicitly depend on org.eclipse.jetty.orbit jar]
+
+ bfba532 Wed Dec 18 22:22:21 2013 -0800
+ Merge pull request #247 from aarondav/minor
+ [Increase spark.akka.askTimeout default to 30 seconds]
+
+ da301b5 Wed Dec 18 20:03:29 2013 -0800
+ Merge pull request #112 from amatsukawa/scc
+ [Strongly connected component algorithm]
+
+ c64a53a Wed Dec 18 16:56:26 2013 -0800
+ Merge pull request #267 from JoshRosen/cygwin
+ [Fix Cygwin support in several scripts.]
+
+ a645ef6 Wed Dec 18 16:07:52 2013 -0800
+ Merge pull request #48 from amatsukawa/add_project_to_graph
+ [Add mask operation on graph and filter graph primitive]
+
+ d7ebff0 Wed Dec 18 15:38:48 2013 -0800
+ Merge pull request #1 from ankurdave/add_project_to_graph
+ [Merge current master and reimplement Graph.mask using innerJoin]
+
+ 5ea1872 Wed Dec 18 15:27:24 2013 -0800
+ Merge pull request #274 from azuryy/master
+ [Fixed the example link in the Scala programming guide.]
+
+ 3fd2e09 Wed Dec 18 12:52:36 2013 -0800
+ Merge pull request #104 from jianpingjwang/master
+ [SVD++ demo]
+
+ f4effb3 Tue Dec 17 22:26:21 2013 -0800
+ Merge pull request #273 from rxin/top
+ [Fixed a performance problem in RDD.top and BoundedPriorityQueue]
+
+ 1b5eacb Tue Dec 17 13:49:17 2013 -0800
+ Merge pull request #102 from ankurdave/clustered-edge-index
+ [Add clustered index on edges by source vertex]
+
+ 7a8169b Mon Dec 16 22:42:21 2013 -0800
+ Merge pull request #268 from pwendell/shaded-protobuf
+ [Add support for 2.2. to master (via shaded jars)]
+
+ 0476c84 Mon Dec 16 17:19:25 2013 -0800
+ Merge pull request #100 from ankurdave/mrTriplets-active-set
+ [Support activeSet option in mapReduceTriplets]
+
+ 964a3b6 Mon Dec 16 15:23:51 2013 -0800
+ Merge pull request #270 from ewencp/really-force-ssh-pseudo-tty-master
+ [Force pseudo-tty allocation in spark-ec2 script.]
+
+ 5192ef3 Mon Dec 16 15:08:08 2013 -0800
+ Merge pull request #94 from ankurdave/load-edges-columnar
+ [Load edges in columnar format]
+
+ 883e034 Mon Dec 16 14:16:02 2013 -0800
+ Merge pull request #245 from gregakespret/task-maxfailures-fix
+ [Fix for spark.task.maxFailures not enforced correctly.]
+
+ a51f340 Sun Dec 15 22:02:30 2013 -0800
+ Merge pull request #265 from markhamstra/scala.binary.version
+ [DRY out the POMs with scala.binary.version]
+
+ ded10ce Sun Dec 15 17:25:33 2013 -0800
+ Merge pull request #103 from amplab/optimizations
+ [Optimizations cherry-picked from SIGMOD branches]
+
+ d2ced6d Sun Dec 15 14:11:34 2013 -0800
+ Merge pull request #256 from MLnick/master
+ [Fix 'IPYTHON=1 ./pyspark' throwing ValueError]
+
+ c55e698 Sun Dec 15 12:49:02 2013 -0800
+ Merge pull request #257 from tgravescs/sparkYarnFixName
+ [Fix the --name option for Spark on Yarn]
+
+ ab85f88 Sun Dec 15 12:48:32 2013 -0800
+ Merge pull request #264 from shivaram/spark-class-fix
+ [Use CoarseGrainedExecutorBackend in spark-class]
+
+ 8a56c1f Sat Dec 14 16:29:24 2013 -0800
+ Merge pull request #84 from amatsukawa/graphlab_enhancements
+ [GraphLab bug fix & set start vertex]
+
+ 7db9165 Sat Dec 14 14:16:34 2013 -0800
+ Merge pull request #251 from pwendell/master
+ [Fix list rendering in YARN markdown docs.]
+
+ 2fd781d Sat Dec 14 12:59:37 2013 -0800
+ Merge pull request #249 from ngbinh/partitionInJavaSortByKey
+ [Expose numPartitions parameter in JavaPairRDD.sortByKey()]
+
+ 9bf192b Sat Dec 14 12:52:18 2013 -0800
+ Merge pull request #91 from amplab/standalone-pagerank
+ [Standalone PageRank]
+
+ 840af5e Sat Dec 14 12:51:51 2013 -0800
+ Merge pull request #99 from ankurdave/only-dynamic-pregel
+ [Remove static Pregel; take maxIterations in dynamic Pregel]
+
+ 97ac060 Sat Dec 14 00:22:45 2013 -0800
+ Merge pull request #259 from pwendell/scala-2.10
+ [Migration to Scala 2.10]
+
+ 7ac944f Fri Dec 13 23:22:08 2013 -0800
+ Merge pull request #262 from pwendell/mvn-fix
+ [Fix maven build issues in 2.10 branch]
+
+ 6defb06 Fri Dec 13 21:18:57 2013 -0800
+ Merge pull request #261 from ScrapCodes/scala-2.10
+ [Added a comment about ActorRef and ActorSelection difference.]
+
+ 76566b1 Fri Dec 13 10:11:02 2013 -0800
+ Merge pull request #260 from ScrapCodes/scala-2.10
+ [Review comments on the PR for scala 2.10 migration.]
+
+ 0aeb182 Thu Dec 12 21:14:42 2013 -0800
+ Merge pull request #255 from ScrapCodes/scala-2.10
+ [Disabled yarn 2.2 in sbt and mvn build and added a message in the sbt build.]
+
+ 2e89398 Wed Dec 11 23:10:53 2013 -0800
+ Merge pull request #254 from ScrapCodes/scala-2.10
+ [Scala 2.10 migration]
+
+ ce6ca4e Wed Dec 11 22:30:54 2013 -0800
+ Merge pull request #97 from dcrankshaw/fix-rddtop
+ [Added BoundedPriorityQueue kryo registrator. Fixes top issue.]
+
+ d2efe13 Tue Dec 10 13:01:26 2013 -0800
+ Merge pull request #250 from pwendell/master
+ [README incorrectly suggests build sources spark-env.sh]
+
+ 6169fe1 Mon Dec 9 16:51:36 2013 -0800
+ Merge pull request #246 from pwendell/master
+ [Add missing license headers]
+
+ d992ec6 Sun Dec 8 20:49:20 2013 -0800
+ Merge pull request #195 from dhardy92/fix_DebScriptPackage
+ [[Deb] fix package of Spark classes adding org.apache prefix in scripts embedded in .deb]
+
+ 1f4a4bc Sat Dec 7 22:34:34 2013 -0800
+ Merge pull request #242 from pwendell/master
+ [Update broken links and add HDP 2.0 version string]
+
+ 6494d62 Sat Dec 7 11:56:16 2013 -0800
+ Merge pull request #240 from pwendell/master
+ [SPARK-917 Improve API links in nav bar]
+
+ f466f79 Sat Dec 7 11:51:52 2013 -0800
+ Merge pull request #239 from aarondav/nit
+ [Correct spelling error in configuration.md]
+
+ 3abfbfb Sat Dec 7 11:24:19 2013 -0800
+ Merge pull request #92 from ankurdave/rdd-names
+ [Set RDD names for easy debugging]
+
+ 31e8a14 Fri Dec 6 21:49:55 2013 -0800
+ Merge pull request #90 from amplab/pregel-replicate-changed
+ [Replicate only changed vertices]
+
+ 10c3c0c Fri Dec 6 20:29:45 2013 -0800
+ Merge pull request #237 from pwendell/formatting-fix
+ [Formatting fix]
+
+ 1b38f5f Fri Dec 6 20:16:15 2013 -0800
+ Merge pull request #236 from pwendell/shuffle-docs
+ [Adding disclaimer for shuffle file consolidation]
+
+ e5d5728 Fri Dec 6 20:14:56 2013 -0800
+ Merge pull request #235 from pwendell/master
+ [Minor doc fixes and updating README]
+
+ 241336a Fri Dec 6 17:29:03 2013 -0800
+ Merge pull request #234 from alig/master
+ [Updated documentation about the YARN v2.2 build process]
+
+ e039234 Fri Dec 6 11:49:59 2013 -0800
+ Merge pull request #190 from markhamstra/Stages4Jobs
+ [stageId <--> jobId mapping in DAGScheduler]
+
+ bfa6860 Fri Dec 6 11:04:03 2013 -0800
+ Merge pull request #233 from hsaputra/changecontexttobackend
+ [Change the name of input argument in ClusterScheduler#initialize from context to backend.]
+
+ 3fb302c Fri Dec 6 11:03:32 2013 -0800
+ Merge pull request #205 from kayousterhout/logging
+ [Added logging of scheduler delays to UI]
+
+ 87676a6 Fri Dec 6 11:01:42 2013 -0800
+ Merge pull request #220 from rxin/zippart
+ [Memoize preferred locations in ZippedPartitionsBaseRDD]
+
+ 0780498 Thu Dec 5 23:29:42 2013 -0800
+ Merge pull request #232 from markhamstra/FiniteWait
+ [jobWaiter.synchronized before jobWaiter.wait]
+
+ 1c8500e Thu Dec 5 16:25:44 2013 -0800
+ Merge pull request #88 from amplab/varenc
+ [Fixed a bug that variable encoding doesn't work for ints that use all 64 bits.]
+
+ e0bcaa0 Thu Dec 5 12:37:02 2013 -0800
+ Merge pull request #86 from ankurdave/vid-varenc
+ [Finish work on #85]
+
+ 5d46025 Thu Dec 5 12:31:24 2013 -0800
+ Merge pull request #228 from pwendell/master
+ [Document missing configs and set shuffle consolidation to false.]
+
+ 3e96b9a Thu Dec 5 12:07:36 2013 -0800
+ Merge pull request #85 from ankurdave/vid-varenc
+ [Always write Vids using variable encoding]
+
+ 72b6961 Wed Dec 4 23:33:04 2013 -0800
+ Merge pull request #199 from harveyfeng/yarn-2.2
+ [Hadoop 2.2 migration]
+
+ e0347ba Wed Dec 4 17:38:06 2013 -0800
+ Merge pull request #83 from ankurdave/fix-tests
+ [Fix compile errors in GraphSuite and SerializerSuite]
+
+ 182f9ba Wed Dec 4 15:52:07 2013 -0800
+ Merge pull request #227 from pwendell/master
+ [Fix small bug in web UI and minor clean-up.]
+
+ cbd3b75 Wed Dec 4 15:35:26 2013 -0800
+ Merge pull request #81 from amplab/clean1
+ [Codebase refactoring]
+
+ b9e7609 Wed Dec 4 14:42:09 2013 -0800
+ Merge pull request #225 from ash211/patch-3
+ [Add missing space after "Serialized" in StorageLevel]
+
+ 055462c Wed Dec 4 14:02:11 2013 -0800
+ Merge pull request #226 from ash211/patch-4
+ [Typo: applicaton]
+
+ d6e5473 Wed Dec 4 10:28:50 2013 -0800
+ Merge pull request #223 from rxin/transient
+ [Mark partitioner, name, and generator field in RDD as @transient.]
+
+ 8a3475a Tue Dec 3 14:21:40 2013 -0800
+ Merge pull request #218 from JoshRosen/spark-970-pyspark-unicode-error
+ [Fix UnicodeEncodeError in PySpark saveAsTextFile() (SPARK-970)]
+
+ 46b87b8 Tue Dec 3 00:41:11 2013 -0800
+ Merge pull request #2 from colorant/yarn-client-2.2
+ [Fix pom.xml for maven build]
+
+ 58d9bbc Mon Dec 2 21:58:53 2013 -0800
+ Merge pull request #217 from aarondav/mesos-urls
+ [Re-enable zk:// urls for Mesos SparkContexts]
+
+ 740922f Sun Dec 1 12:46:58 2013 -0800
+ Merge pull request #219 from sundeepn/schedulerexception
+ [Scheduler quits when newStage fails]
+
+ 60e23a5 Sat Nov 30 23:38:49 2013 -0800
+ Merge pull request #216 from liancheng/fix-spark-966
+ [Bugfix: SPARK-965 & SPARK-966]
+
+ 34ee814 Sat Nov 30 15:10:30 2013 -0800
+ Merged Ankur's pull request #80 and fixed subgraph.
+ []
+
+ 743a31a Wed Nov 27 18:24:39 2013 -0800
+ Merge pull request #210 from haitaoyao/http-timeout
+ [add http timeout for httpbroadcast]
+
+ 993e293 Wed Nov 27 00:57:54 2013 -0800
+ Merge pull request #1 from colorant/yarn-client-2.2
+ [Port yarn-client mode for new-yarn]
+
+ fb6875d Tue Nov 26 20:55:40 2013 -0800
+ Merge pull request #146 from JoshRosen/pyspark-custom-serializers
+ [Custom Serializers for PySpark]
+
+ 330ada1 Tue Nov 26 19:08:33 2013 -0800
+ Merge pull request #207 from henrydavidge/master
+ [Log a warning if a task's serialized size is very big]
+
+ 615213f Tue Nov 26 19:07:20 2013 -0800
+ Merge pull request #212 from markhamstra/SPARK-963
+ [[SPARK-963] Fixed races in JobLoggerSuite]
+
+ cb976df Tue Nov 26 10:23:19 2013 -0800
+ Merge pull request #209 from pwendell/better-docs
+ [Improve docs for shuffle instrumentation]
+
+ 18d6df0 Tue Nov 26 00:00:07 2013 -0800
+ Merge pull request #86 from holdenk/master
+ [Add histogram functionality to DoubleRDDFunctions]
+
+ 0e2109d Mon Nov 25 20:48:37 2013 -0800
+ Merge pull request #204 from rxin/hash
+ [OpenHashSet fixes]
+
+ c46067f Mon Nov 25 19:09:31 2013 -0800
+ Merge pull request #206 from ash211/patch-2
+ [Update tuning.md]
+
+ 14bb465 Mon Nov 25 18:50:18 2013 -0800
+ Merge pull request #201 from rxin/mappartitions
+ [Use the proper partition index in mapPartitionsWithIndex]
+
+ eb4296c Mon Nov 25 15:25:29 2013 -0800
+ Merge pull request #101 from colorant/yarn-client-scheduler
+ [For SPARK-527, Support spark-shell when running on YARN]
+
+ 466fd06 Mon Nov 25 18:27:26 2013 +0800
+ Incorporated ideas from pull request #200. - Use Murmur Hash 3 finalization step to scramble the bits of HashCode instead of the simpler version in java.util.HashMap; the latter one had trouble with ranges of consecutive integers. Murmur Hash 3 is used by fastutil.
+ [- Don't check keys for equality when re-inserting due to growing the]
+
+ 088995f Mon Nov 25 00:57:51 2013 -0800
+ Merge pull request #77 from amplab/upgrade
+ [Sync with Spark master]
+
+ 62889c4 Mon Nov 25 11:27:45 2013 +0800
+ Merge pull request #203 from witgo/master
+ [ Fix Maven build for metrics-graphite]
+
+ 6af03ed Sun Nov 24 16:42:37 2013 -0800
+ Merge pull request #76 from dcrankshaw/fix_partitioners
+ [Actually use partitioner command line args in Analytics.]
+
+ 859d62d Sun Nov 24 16:19:51 2013 -0800
+ Merge pull request #151 from russellcardullo/add-graphite-sink
+ [Add graphite sink for metrics]
+
+ 65de73c Sun Nov 24 15:52:33 2013 -0800
+ Merge pull request #185 from mkolod/random-number-generator
+ [XORShift RNG with unit tests and benchmark]
+
+ 972171b Mon Nov 25 07:50:46 2013 +0800
+ Merge pull request #197 from aarondav/patrick-fix
+ [Fix 'timeWriting' stat for shuffle files]
+
+ a1a7e36 Sun Nov 24 05:15:09 2013 -0800
+ Merge pull request #75 from amplab/simplify
+ [Simplify GraphImpl internals]
+
+ 718cc80 Sun Nov 24 11:02:02 2013 +0800
+ Merge pull request #200 from mateiz/hash-fix
+ [AppendOnlyMap fixes]
+
+ 51aa9d6 Sat Nov 23 19:46:46 2013 +0800
+ Merge pull request #198 from ankurdave/zipPartitions-preservesPartitioning
+ [Support preservesPartitioning in RDD.zipPartitions]
+
+ 18ce7e9 Fri Nov 22 17:02:40 2013 -0800
+ Merge pull request #73 from jegonzal/TriangleCount
+ [Triangle count]
+
+ 086b097 Fri Nov 22 10:26:39 2013 +0800
+ Merge pull request #193 from aoiwelle/patch-1
+ [Fix Kryo Serializer buffer documentation inconsistency]
+
+ f20093c Fri Nov 22 10:12:13 2013 +0800
+ Merge pull request #196 from pwendell/master
+ [TimeTrackingOutputStream should pass on calls to close() and flush().]
+
+ 4b89501 Wed Nov 20 10:36:10 2013 -0800
+ Merge pull request #191 from hsaputra/removesemicolonscala
+ [Cleanup to remove semicolons (;) from Scala code]
+
+ 202f8e6 Wed Nov 20 03:26:08 2013 -0800
+ Merge pull request #74 from dcrankshaw/remove_sleep
+ [Removed sleep from pagerank in Analytics]
+
+ 74ade9e Tue Nov 19 16:53:58 2013 -0800
+ Merge pull request #62 from dcrankshaw/partitioners
+ [Allow user to choose a partitioner at runtime]
+
+ f568912 Tue Nov 19 16:11:31 2013 -0800
+ Merge pull request #181 from BlackNiuza/fix_tasks_number
+ [correct number of tasks in ExecutorsUI]
+
+ aa638ed Tue Nov 19 16:05:44 2013 -0800
+ Merge pull request #189 from tgravescs/sparkYarnErrorHandling
+ [Improve Spark on Yarn Error handling]
+
+ 5592580 Tue Nov 19 16:04:01 2013 -0800
+ Merge pull request #187 from aarondav/example-bcast-test
+ [Enable the Broadcast examples to work in a cluster setting]
+
+ 99cfe89 Mon Nov 18 22:00:36 2013 -0500
+ Updates to reflect pull request code review
+ []
+
+ e2ebc3a Sun Nov 17 18:42:18 2013 -0800
+ Merge pull request #182 from rxin/vector
+ [Slightly enhanced PrimitiveVector:]
+
+ 26f616d Sun Nov 17 18:18:16 2013 -0800
+ Merge pull request #3 from aarondav/pv-test
+ [Add PrimitiveVectorSuite and fix bug in resize()]
+
+ 1b5b358 Sat Nov 16 11:44:10 2013 -0800
+ Merge pull request #178 from hsaputra/simplecleanupcode
+ [Simple cleanup on Spark's Scala code]
+
+ 62a2a71 Fri Nov 15 13:12:07 2013 -0800
+ Merge pull request #65 from amplab/varenc
+ [Use variable encoding for ints, longs, and doubles in the specialized serializers.]
+
+ f6b2e59 Thu Nov 14 23:04:55 2013 -0800
+ Merge pull request #1 from aarondav/scala210-master
+ [Various merge corrections]
+
+ 96e0fb4 Thu Nov 14 22:29:28 2013 -0800
+ Merge pull request #173 from kayousterhout/scheduler_hang
+ [Fix bug where scheduler could hang after task failure.]
+
+ dfd40e9 Thu Nov 14 19:44:50 2013 -0800
+ Merge pull request #175 from kayousterhout/no_retry_not_serializable
+ [Don't retry tasks when they fail due to a NotSerializableException]
+
+ ed25105 Thu Nov 14 19:43:55 2013 -0800
+ Merge pull request #174 from ahirreddy/master
+ [Write Spark UI url to driver file on HDFS]
+
+ 1a4cfbe Thu Nov 14 10:32:11 2013 -0800
+ Merge pull request #169 from kayousterhout/mesos_fix
+ [Don't ignore spark.cores.max when using Mesos Coarse mode]
+
+ 5a4f483 Thu Nov 14 10:30:36 2013 -0800
+ Merge pull request #170 from liancheng/hadooprdd-doc-typo
+ [Fixed a scaladoc typo in HadoopRDD.scala]
+
+ d76f520 Thu Nov 14 10:25:48 2013 -0800
+ Merge pull request #171 from RIA-pierre-borckmans/master
+ [Fixed typos in the CDH4 distributions version codes.]
+
+ 2c39d80 Wed Nov 13 23:28:01 2013 -0800
+ Merge pull request #69 from jegonzal/MissingVertices
+ [Addressing issue in Graph creation]
+
+ 33b2dea Wed Nov 13 17:55:58 2013 -0800
+ Merge pull request #1 from ankurdave/MissingVertices
+ [During graph creation, create eTable earlier]
+
+ 2054c61 Wed Nov 13 16:49:55 2013 -0800
+ Merge pull request #159 from liancheng/dagscheduler-actor-refine
+ [Migrate the daemon thread started by DAGScheduler to Akka actor]
+
+ 9290e5b Wed Nov 13 16:48:44 2013 -0800
+ Merge pull request #165 from NathanHowell/kerberos-master
+ [spark-assembly.jar fails to authenticate with YARN ResourceManager]
+
+ a81fcb7 Wed Nov 13 10:41:01 2013 -0800
+ Merge pull request #68 from jegonzal/BitSetSetUntilBug
+ [Addressing bug in BitSet.setUntil(ind)]
+
+ 39af914 Wed Nov 13 08:39:05 2013 -0800
+ Merge pull request #166 from ahirreddy/simr-spark-ui
+ [SIMR Backend Scheduler will now write Spark UI URL to HDFS, which is to ...]
+
+ f49ea28 Tue Nov 12 19:13:39 2013 -0800
+ Merge pull request #137 from tgravescs/sparkYarnJarsHdfsRebase
+ [Allow spark on yarn to be run from HDFS.]
+
+ 87f2f4e Tue Nov 12 16:26:09 2013 -0800
+ Merge pull request #153 from ankurdave/stop-spot-cluster
+ [Enable stopping and starting a spot cluster]
+
+ b8bf04a Tue Nov 12 16:19:50 2013 -0800
+ Merge pull request #160 from xiajunluan/JIRA-923
+ [Fix bug JIRA-923]
+
+ dfd1ebc Tue Nov 12 09:10:05 2013 -0800
+ Merge pull request #164 from tdas/kafka-fix
+ [Made block generator thread safe to fix Kafka bug.]
+
+ 2e8d450 Mon Nov 11 17:34:09 2013 -0800
+ Merge pull request #63 from jegonzal/VertexSetCleanup
+ [Cleanup of VertexSetRDD]
+
+ b8e294a Mon Nov 11 16:25:42 2013 -0800
+ Merge pull request #61 from ankurdave/pid2vid
+ [Shuffle replicated vertex attributes efficiently in columnar format]
+
+ 3d7277c Mon Nov 11 15:49:28 2013 -0800
+ Merge pull request #55 from ankurdave/aggregateNeighbors-variants
+ [Specialize mapReduceTriplets for accessing subsets of vertex attributes]
+
+ 23b53ef Mon Nov 11 12:30:02 2013 -0800
+ Merge pull request #156 from haoyuan/master
+ [add tachyon module]
+
+ 1a06f70 Sun Nov 10 10:54:44 2013 -0800
+ Merge pull request #60 from amplab/rxin
+ [Looks good to me.]
+
+ 58d4f6c Sun Nov 10 09:23:56 2013 -0800
+ Merge pull request #157 from rxin/kryo
+ [3 Kryo related changes.]
+
+ 3efc019 Sat Nov 9 17:53:49 2013 -0800
+ Merge pull request #147 from JoshRosen/fix-java-api-completeness-checker
+ [Add spark-tools assembly to spark-class's classpath]
+
+ 87954d4 Sat Nov 9 17:53:25 2013 -0800
+ Merge pull request #154 from soulmachine/ClusterScheduler
+ [Replace the thread inside ClusterScheduler.start() with an Akka scheduler]
+
+ f6c9462 Sat Nov 9 16:14:45 2013 -0800
+ Merge pull request #58 from jegonzal/KryoMessages
+ [Kryo messages]
+
+ 83bf192 Sat Nov 9 15:40:29 2013 -0800
+ Merge pull request #155 from rxin/jobgroup
+ [Don't reset job group when a new job description is set.]
+
+ 8af99f2 Sat Nov 9 13:48:00 2013 -0800
+ Merge pull request #149 from tgravescs/fixSecureHdfsAccess
+ [Fix secure hdfs access for spark on yarn]
+
+ 72a601e Sat Nov 9 11:55:16 2013 -0800
+ Merge pull request #152 from rxin/repl
+ [Propagate SparkContext local properties from spark-repl caller thread to the repl execution thread.]
+
+ 6ee05be Thu Nov 7 19:12:41 2013 -0800
+ Merge pull request #49 from jegonzal/graphxshell
+ [GraphX Console with Logo Text]
+
+ a9f96b5 Thu Nov 7 18:56:56 2013 -0800
+ Merge pull request #56 from jegonzal/PregelAPIChanges
+ [Changing Pregel API to use mapReduceTriplets instead of aggregateNeighbors]
+
+ 5907137 Thu Nov 7 16:58:31 2013 -0800
+ Merge pull request #54 from amplab/rxin
+ [Converted for loops to while loops in EdgePartition.]
+
+ edf4164 Thu Nov 7 16:22:43 2013 -0800
+ Merge pull request #53 from amplab/rxin
+ [Added GraphX to classpath.]
+
+ c379e10 Thu Nov 7 16:01:47 2013 -0800
+ Merge pull request #51 from jegonzal/VertexSetRDD
+ [Reverting to Array based (materialized) output in VertexSetRDD]
+
+ 3d4ad84 Thu Nov 7 11:08:27 2013 -0800
+ Merge pull request #148 from squito/include_appId
+ [Include appId in executor cmd line args]
+
+ be7e8da Wed Nov 6 23:22:47 2013 -0800
+ Merge pull request #23 from jerryshao/multi-user
+ [Add Spark multi-user support for standalone mode and Mesos]
+
+ aadeda5 Wed Nov 6 13:27:47 2013 -0800
+ Merge pull request #144 from liancheng/runjob-clean
+ [Removed unused return value in SparkContext.runJob]
+
+ 951024f Wed Nov 6 09:36:14 2013 -0800
+ Merge pull request #145 from aarondav/sls-fix
+ [Attempt to fix SparkListenerSuite breakage]
+
+ bf4e613 Tue Nov 5 23:14:09 2013 -0800
+ Merge pull request #143 from rxin/scheduler-hang
+ [Ignore a task update status if the executor doesn't exist anymore.]
+
+ 9f7b9bb Tue Nov 5 10:42:19 2013 -0800
+ Merge pull request #142 from liancheng/dagscheduler-pattern-matching
+ [Using case class deep match to simplify code in DAGScheduler.processEvent]
+
+ ca44b51 Tue Nov 5 01:32:55 2013 -0800
+ Merge pull request #50 from amplab/mergemerge
+ [Merge Spark master into graphx]
+
+ 8106532 Mon Nov 4 20:47:14 2013 -0800
+ Merge pull request #139 from aarondav/shuffle-next
+ [Never store shuffle blocks in BlockManager]
+
+ 0b26a39 Mon Nov 4 18:22:06 2013 -0800
+ Merge pull request #128 from shimingfei/joblogger-doc
+ [add javadoc to JobLogger, and some small fix]
+
+ 7a26104 Mon Nov 4 17:54:06 2013 -0800
+ Merge pull request #130 from aarondav/shuffle
+ [Memory-optimized shuffle file consolidation]
+
+ b5dc339 Sun Nov 3 20:43:15 2013 -0800
+ Merge pull request #70 from rxin/hash1
+ [Fast, memory-efficient hash set, hash table implementations optimized for primitive data types.]
+
+ 41ead7a Sat Nov 2 14:41:50 2013 -0700
+ Merge pull request #133 from Mistobaan/link_fix
+ [update default github]
+
+ d407c07 Sat Nov 2 14:36:37 2013 -0700
+ Merge pull request #134 from rxin/readme
+ [Fixed a typo in Hadoop version in README.]
+
+ e7c7b80 Fri Nov 1 17:58:10 2013 -0700
+ Merge pull request #132 from Mistobaan/doc_fix
+ [fix persistent-hdfs]
+
+ d6d11c2 Fri Nov 1 15:40:33 2013 -0700
+ Merge pull request #129 from velvia/2013-11/document-local-uris
+ [Document & finish support for local: URIs]
+
+ 99bfcc9 Thu Oct 31 21:38:10 2013 -0700
+ Merge pull request #46 from jegonzal/VertexSetWithHashSet
+ [Switched VertexSetRDD and GraphImpl to use OpenHashSet]
+
+ fcaaf86 Thu Oct 31 18:27:30 2013 -0700
+ Merge pull request #44 from jegonzal/rxinBitSet
+ [Switching to VertexSetRDD to use @rxin BitSet and OpenHash ]
+
+ 3f3c727 Thu Oct 31 09:52:25 2013 -0700
+ Merge pull request #41 from jegonzal/LineageTracking
+ [Optimizing Graph Lineage]
+
+ 944f6b8 Thu Oct 31 09:40:35 2013 -0700
+ Merge pull request #43 from amplab/FixBitSetCastException
+ [Fix BitSet cast exception]
+
+ 8f1098a Wed Oct 30 20:11:48 2013 -0700
+ Merge pull request #117 from stephenh/avoid_concurrent_modification_exception
+ [Handle ConcurrentModificationExceptions in SparkContext init.]
+
+ dc9ce16 Wed Oct 30 17:01:56 2013 -0700
+ Merge pull request #126 from kayousterhout/local_fix
+ [Fixed incorrect log message in local scheduler]
+
+ 33de11c Wed Oct 30 16:58:27 2013 -0700
+ Merge pull request #124 from tgravescs/sparkHadoopUtilFix
+ [Pull SparkHadoopUtil out of SparkEnv (jira SPARK-886)]
+
+ a0c86c3 Wed Oct 30 15:34:39 2013 -0700
+ Merge pull request #38 from jegonzal/Documentation
+ [Improving Documentation]
+
+ 618c1f6 Wed Oct 30 12:03:44 2013 -0700
+ Merge pull request #125 from velvia/2013-10/local-jar-uri
+ [Add support for local:// URI scheme for addJars()]
+
+ 745dc42 Tue Oct 29 23:47:10 2013 -0700
+ Merge pull request #118 from JoshRosen/blockinfo-memory-usage
+ [Reduce the memory footprint of BlockInfo objects]
+
+ 06adf63 Tue Oct 29 16:43:46 2013 -0700
+ Merge pull request #33 from kellrott/master
+ [Fixing graph/pom.xml]
+
+ 098768e Tue Oct 29 15:08:36 2013 -0700
+ Merge pull request #37 from jegonzal/AnalyticsCleanup
+ [Updated Connected Components and Pregel Docs]
+
+ f0e23a0 Tue Oct 29 01:41:44 2013 -0400
+ Merge pull request #119 from soulmachine/master
+ [A little revise for the document]
+
+ aec9bf9 Sun Oct 27 19:32:00 2013 -0700
+ Merge pull request #112 from kayousterhout/ui_task_attempt_id
+ [Display both task ID and task attempt ID in UI, and rename taskId to taskAttemptId]
+
+ d4df474 Sun Oct 27 22:11:21 2013 -0400
+ Merge pull request #115 from aarondav/shuffle-fix
+ [Eliminate extra memory usage when shuffle file consolidation is disabled]
+
+ e018f2d Sat Oct 26 11:39:15 2013 -0700
+ Merge pull request #113 from pwendell/master
+ [Improve error message when multiple assembly jars are present.]
+
+ 662ee9f Sat Oct 26 11:35:59 2013 -0700
+ Merge pull request #114 from soulmachine/master
+ [A little revise for the document]
+
+ bab496c Fri Oct 25 18:28:43 2013 -0700
+ Merge pull request #108 from alig/master
+ [Changes to enable executing by using HDFS as a synchronization point between driver and executors, as well as ensuring executors exit properly.]
+
+ d307db6 Fri Oct 25 17:26:06 2013 -0700
+ Merge pull request #102 from tdas/transform
+ [Added new Spark Streaming operations]
+
+ 85e2cab Fri Oct 25 14:46:06 2013 -0700
+ Merge pull request #111 from kayousterhout/ui_name
+ [Properly display the name of a stage in the UI.]
+
+ ab35ec4 Fri Oct 25 10:16:18 2013 -0700
+ Merge pull request #110 from pwendell/master
+ [Exclude jopt from kafka dependency.]
+
+ 4f2c943 Thu Oct 24 22:32:02 2013 -0700
+ Merge pull request #109 from pwendell/master
+ [Adding Java/Java Streaming versions of `repartition` with associated tests]
+
+ 99ad4a6 Thu Oct 24 17:08:39 2013 -0700
+ Merge pull request #106 from pwendell/master
+ [Add a `repartition` operator.]
+
+ 5429d62 Thu Oct 24 11:15:55 2013 -0700
+ Merge pull request #107 from ScrapCodes/scala-2.10
+ [Updating to latest akka 2.2.3, which fixes our only failing test Driver Suite.]
+
+ 6f82c42 Thu Oct 24 11:09:46 2013 -0700
+ Merge pull request #34 from jegonzal/AnalyticsCleanup
+ [Analytics Cleanup]
+
+ 1dc776b Wed Oct 23 22:05:52 2013 -0700
+ Merge pull request #93 from kayousterhout/ui_new_state
+ [Show "GETTING_RESULTS" state in UI.]
+
+ c4b187d Wed Oct 23 21:56:18 2013 -0700
+ Merge pull request #105 from pwendell/doc-fix
+ [Fixing broken links in programming guide]
+
+ a098438 Wed Oct 23 18:03:08 2013 -0700
+ Merge pull request #103 from JoshRosen/unpersist-fix
+ [Add unpersist() to JavaDoubleRDD and JavaPairRDD.]
+
+ dd65964 Wed Oct 23 15:07:59 2013 -0700
+ Merge pull request #64 from prabeesh/master
+ [MQTT Adapter for Spark Streaming]
+
+ 452aa36 Tue Oct 22 23:15:33 2013 -0700
+ Merge pull request #97 from ewencp/pyspark-system-properties
+ [Add classmethod to SparkContext to set system properties.]
+
+ 9dfcf53 Tue Oct 22 16:01:42 2013 -0700
+ Merge pull request #100 from JoshRosen/spark-902
+ [Remove redundant Java Function call() definitions]
+
+ 49d5cda Tue Oct 22 15:38:02 2013 -0700
+ Merge pull request #30 from jegonzal/VertexSetRDD_Tests
+ [Testing and Documenting VertexSetRDD]
+
+ 97184de Tue Oct 22 13:10:14 2013 -0700
+ Merge pull request #99 from pwendell/master
+ [Use correct formatting for comments in StoragePerfTester]
+
+ c404adb Tue Oct 22 11:30:19 2013 -0700
+ Merge pull request #90 from pwendell/master
+ [SPARK-940: Do not directly pass Stage objects to SparkListener.]
+
+ aa9019f Tue Oct 22 10:30:02 2013 -0700
+ Merge pull request #98 from aarondav/docs
+ [Docs: Fix links to RDD API documentation]
+
+ a0e08f0 Tue Oct 22 10:20:43 2013 -0700
+ Merge pull request #82 from JoshRosen/map-output-tracker-refactoring
+ [Split MapOutputTracker into Master/Worker classes]
+
+ b84193c Mon Oct 21 23:35:13 2013 -0700
+ Merge pull request #92 from tgravescs/sparkYarnFixClasspath
+ [Fix the Worker to use CoarseGrainedExecutorBackend and modify classpath ...]
+
+ 731c94e Mon Oct 21 23:31:38 2013 -0700
+ Merge pull request #56 from jerryshao/kafka-0.8-dev
+ [Upgrade Kafka 0.7.2 to Kafka 0.8.0-beta1 for Spark Streaming]
+
+ 48952d6 Mon Oct 21 22:45:00 2013 -0700
+ Merge pull request #87 from aarondav/shuffle-base
+ [Basic shuffle file consolidation]
+
+ a51359c Mon Oct 21 20:33:29 2013 -0700
+ Merge pull request #95 from aarondav/perftest
+ [Minor: Put StoragePerfTester in org/apache/]
+
+ 39d2e9b Mon Oct 21 18:58:48 2013 -0700
+ Merge pull request #94 from aarondav/mesos-fix
+ [Fix mesos urls]
+
+ aa61bfd Mon Oct 21 11:57:05 2013 -0700
+ Merge pull request #88 from rxin/clean
+ [Made the following traits/interfaces/classes non-public:]
+
+ 35886f3 Sun Oct 20 22:20:32 2013 -0700
+ Merge pull request #41 from pwendell/shuffle-benchmark
+ [Provide Instrumentation for Shuffle Write Performance]
+
+ 5b9380e Sun Oct 20 21:03:51 2013 -0700
+ Merge pull request #89 from rxin/executor
+ [Don't setup the uncaught exception handler in local mode.]
+
+ 261bcf2 Sun Oct 20 17:59:51 2013 -0700
+ Merge pull request #80 from rxin/build
+ [Exclusion rules for Maven build files.]
+
+ edc5e3f Sun Oct 20 17:18:06 2013 -0700
+ Merge pull request #75 from JoshRosen/block-manager-cleanup
+ [Code de-duplication in BlockManager]
+
+ 2a7ae17 Sun Oct 20 11:45:21 2013 -0700
+ Merge pull request #84 from rxin/kill1
+ [Added documentation for setJobGroup. Also some minor cleanup in SparkContext.]
+
+ e4abb75 Sun Oct 20 09:38:37 2013 -0700
+ Merge pull request #85 from rxin/clean
+ [Moved the top level spark package object from spark to org.apache.spark]
+
+ 136b9b3 Sun Oct 20 02:58:26 2013 -0700
+ Basic shuffle file consolidation
+ [The Spark shuffle phase can produce a large number of files, as one file is created]
+
+ 747f538 Sat Oct 19 23:40:40 2013 -0700
+ Merge pull request #83 from ewencp/pyspark-accumulator-add-method
+ [Add an add() method to pyspark accumulators.]
+
+ 6511bbe Sat Oct 19 11:34:56 2013 -0700
+ Merge pull request #78 from mosharaf/master
+ [Removed BitTorrentBroadcast and TreeBroadcast.]
+
+ f628804 Fri Oct 18 23:19:42 2013 -0700
+ Merge pull request #76 from pwendell/master
+ [Clarify compression property.]
+
+ 599dcb0 Fri Oct 18 22:49:00 2013 -0700
+ Merge pull request #74 from rxin/kill
+ [Job cancellation via job group id.]
+
+ 9cf43cf Fri Oct 18 22:07:21 2013 -0700
+ Merge pull request #28 from jegonzal/VertexSetRDD
+ [Refactoring IndexedRDD to VertexSetRDD.]
+
+ f888a5b Fri Oct 18 22:06:58 2013 -0700
+ Merge pull request #29 from ankurdave/unit-tests
+ [Unit tests for Graph and GraphOps]
+
+ 8de9706 Fri Oct 18 20:32:39 2013 -0700
+ Merge pull request #66 from shivaram/sbt-assembly-deps
+ [Add SBT target to assemble dependencies]
+
+ e5316d0 Fri Oct 18 20:30:56 2013 -0700
+ Merge pull request #68 from mosharaf/master
+ [Faster and stable/reliable broadcast]
+
+ 8d528af Fri Oct 18 20:24:10 2013 -0700
+ Merge pull request #71 from aarondav/scdefaults
+ [Spark shell exits if it cannot create SparkContext]
+
+ 0794bd7 Fri Oct 18 18:59:58 2013 -0700
+ Merge pull request #27 from jegonzal/removed_indexedrdd_from_core
+ [Removing IndexedRDD changes for spark/core]
+
+ 099977f Thu Oct 17 14:17:08 2013 -0700
+ Merge pull request #26 from ankurdave/split-vTableReplicated
+ [Great work!]
+
+ fc26e5b Thu Oct 17 13:21:07 2013 -0700
+ Merge pull request #69 from KarthikTunga/master
+ [Fix for issue SPARK-627. Implementing --config argument in the scripts.]
+
+ cf64f63 Thu Oct 17 11:12:28 2013 -0700
+ Merge pull request #67 from kayousterhout/remove_tsl
+ [Removed TaskSchedulerListener interface.]
+
+ f9973ca Wed Oct 16 15:58:41 2013 -0700
+ Merge pull request #65 from tgravescs/fixYarn
+ [Fix yarn build]
+
+ 28e9c2a Tue Oct 15 23:59:56 2013 -0700
+ Merge pull request #63 from pwendell/master
+ [Fixing spark streaming example and a bug in examples build.]
+
+ 4e46fde Tue Oct 15 23:14:27 2013 -0700
+ Merge pull request #62 from harveyfeng/master
+ [Make TaskContext's stageId publicly accessible.]
+
+ b534606 Tue Oct 15 21:25:03 2013 -0700
+ Merge pull request #8 from vchekan/checkpoint-ttl-restore
+ [Serialize and restore spark.cleaner.ttl to savepoint]
+
+ 6dbd220 Tue Oct 15 19:02:57 2013 -0700
+ Merge pull request #34 from kayousterhout/rename
+ [Renamed StandaloneX to CoarseGrainedX.]
+
+ 983b83f Tue Oct 15 19:02:46 2013 -0700
+ Merge pull request #61 from kayousterhout/daemon_thread
+ [Unified daemon thread pools]
+
+ 3249e0e Tue Oct 15 14:12:33 2013 -0700
+ Merge pull request #59 from rxin/warning
+ [Bump up logging level to warning for failed tasks.]
+
+ 678dec6 Tue Oct 15 10:51:46 2013 -0700
+ Merge pull request #58 from hsaputra/update-pom-asf
+ [Update pom.xml to use version 13 of the ASF parent pom]
+
+ e33b183 Mon Oct 14 22:25:47 2013 -0700
+ Merge pull request #29 from rxin/kill
+ [Job killing]
+
+ 3b11f43 Mon Oct 14 14:20:01 2013 -0700
+ Merge pull request #57 from aarondav/bid
+ [Refactor BlockId into an actual type]
+
+ 9979690 Sat Oct 12 21:23:26 2013 -0700
+ Merge pull request #52 from harveyfeng/hadoop-closure
+ [Add an optional closure parameter to HadoopRDD instantiation to use when creating local JobConfs.]
+
+ dca8009 Fri Oct 11 16:08:15 2013 -0700
+ Merge pull request #54 from aoiwelle/remove_unused_imports
+ [Remove unnecessary mutable imports]
+
+ 0e5052b Fri Oct 11 15:45:16 2013 -0700
+ Merge pull request #51 from ScrapCodes/scala-2.10
+ [Scala 2.10]
+
+ fb25f32 Fri Oct 11 15:44:43 2013 -0700
+ Merge pull request #53 from witgo/master
+ [Add a zookeeper compile dependency to fix build in maven]
+
+ d6ead47 Fri Oct 11 15:43:01 2013 -0700
+ Merge pull request #32 from mridulm/master
+ [Address review comments, move to incubator spark]
+
+ c71499b Thu Oct 10 17:16:42 2013 -0700
+ Merge pull request #19 from aarondav/master-zk
+ [Standalone Scheduler fault tolerance using ZooKeeper]
+
+ 5867a82 Thu Oct 10 14:02:37 2013 -0700
+ Merge pull request #19 from dcrankshaw/master
+ [Merge canonical 2d partitioner and group edges into benchmarks]
+
+ cd08f73 Thu Oct 10 13:55:47 2013 -0700
+ Merge pull request #44 from mateiz/fast-map
+ [A fast and low-memory append-only map for shuffle operations]
+
+ 4b46d51 Thu Oct 10 13:35:36 2013 -0700
+ Merge pull request #17 from amplab/product2
+ [product 2 change]
+
+ 320418f Wed Oct 9 16:55:30 2013 -0700
+ Merge pull request #49 from mateiz/kryo-fix-2
+ [Fix Chill serialization of Range objects]
+
+ 215238c Wed Oct 9 16:49:44 2013 -0700
+ Merge pull request #50 from kayousterhout/SPARK-908
+ [Fix race condition in SparkListenerSuite (fixes SPARK-908).]
+
+ 7827efc Wed Oct 9 15:07:25 2013 -0700
+ Merge pull request #46 from mateiz/py-sort-update
+ [Fix PySpark docs and an overly long line of code after #38]
+
+ 7b3ae04 Wed Oct 9 12:14:19 2013 -0700
+ Merge pull request #45 from pwendell/metrics_units
+ [Use standard abbreviation in metrics description (MBytes -> MB)]
+
+ b4fa11f Wed Oct 9 11:59:47 2013 -0700
+ Merge pull request #38 from AndreSchumacher/pyspark_sorting
+ [SPARK-705: implement sortByKey() in PySpark]
+
+ 19d445d Wed Oct 9 11:08:34 2013 -0700
+ Merge pull request #22 from GraceH/metrics-naming
+ [SPARK-900 Use coarser grained naming for metrics]
+
+ 7d50f9f Wed Oct 9 10:32:42 2013 -0700
+ Merge pull request #35 from MartinWeindel/scala-2.10
+ [Fixing inconsistencies and warnings on Scala 2.10 branch]
+
+ 3218fa7 Tue Oct 8 23:44:55 2013 -0700
+ Merge pull request #4 from MLnick/implicit-als
+ [Adding algorithm for implicit feedback data to ALS]
+
+ e67d5b9 Tue Oct 8 22:57:38 2013 -0700
+ Merge pull request #43 from mateiz/kryo-fix
+ [Don't allocate Kryo buffers unless needed]
+
+ ea34c52 Mon Oct 7 20:45:58 2013 -0700
+ Merge pull request #42 from pwendell/shuffle-read-perf
+ [Fix inconsistent and incorrect log messages in shuffle read path]
+
+ 02f37ee Mon Oct 7 15:48:52 2013 -0700
+ Merge pull request #39 from pwendell/master
+ [Adding Shark 0.7.1 to EC2 scripts]
+
+ 213b70a Mon Oct 7 10:54:22 2013 -0700
+ Merge pull request #31 from sundeepn/branch-0.8
+ [Resolving package conflicts with hadoop 0.23.9]
+
+ d585613 Sat Oct 5 22:57:05 2013 -0700
+ Merge pull request #37 from pwendell/merge-0.8
+ [merge in remaining changes from `branch-0.8`]
+
+ 4a25b11 Sat Oct 5 19:28:55 2013 -0700
+ Merge pull request #20 from harveyfeng/hadoop-config-cache
+ [Allow users to pass broadcasted Configurations and cache InputFormats across Hadoop file reads.]
+
+ 8fc68d0 Sat Oct 5 17:24:35 2013 -0700
+ Merge pull request #36 from pwendell/versions
+ [Bumping EC2 default version in master to .]
+
+ 100222b Sat Oct 5 13:38:59 2013 -0700
+ Merge pull request #27 from davidmccauley/master
+ [SPARK-920/921 - JSON endpoint updates]
+
+ 0864193 Sat Oct 5 13:25:18 2013 -0700
+ Merge pull request #33 from AndreSchumacher/pyspark_partition_key_change
+ [Fixing SPARK-602: PythonPartitioner]
+
+ 61ffcde Fri Oct 4 10:52:17 2013 -0700
+ Merge pull request #15 from dcrankshaw/master
+ [Add synthetic generators]
+
+ 3fe12cc Fri Oct 4 10:51:28 2013 -0700
+ Merge pull request #946 from ScrapCodes/scala-2.10
+ [Fixed non termination of Executor backend, when sc.stop is not called and system.exit instead.]
+
+ 232765f Thu Oct 3 12:00:48 2013 -0700
+ Merge pull request #26 from Du-Li/master
+ [fixed a wildcard bug in make-distribution.sh; ask sbt to check local]
+
+ 405e69b Thu Oct 3 10:52:41 2013 -0700
+ Merge pull request #25 from CruncherBigData/master
+ [Update README: updated the link]
+
+ 49dbfcc Thu Oct 3 10:52:06 2013 -0700
+ Merge pull request #28 from tgravescs/sparYarnAppName
+ [Allow users to set the application name for Spark on Yarn]
+
+ e597ea3 Wed Oct 2 21:14:24 2013 -0700
+ Merge pull request #10 from kayousterhout/results_through-bm
+ [Send Task results through the block manager when larger than Akka frame size (fixes SPARK-669).]
+
+ 714fdab Thu Sep 26 14:28:55 2013 -0700
+ Merge pull request #17 from rxin/optimize
+ [Remove -optimize flag]
+
+ 13eced7 Thu Sep 26 14:18:19 2013 -0700
+ Merge pull request #16 from pwendell/master
+ [Bug fix in master build]
+
+ 70a0b99 Thu Sep 26 14:11:54 2013 -0700
+ Merge pull request #14 from kayousterhout/untangle_scheduler
+ [Improved organization of scheduling packages.]
+
+ afd03b2 Thu Sep 26 14:09:55 2013 -0700
+ Merge pull request #943 from ScrapCodes/scala-2.10
+ [Scala 2.10 with akka 2.2]
+
+ 76677b8 Thu Sep 26 14:03:46 2013 -0700
+ Merge pull request #670 from jey/ec2-ssh-improvements
+ [EC2 SSH improvements]
+
+ c514cd1 Thu Sep 26 13:48:20 2013 -0700
+ Merge pull request #930 from holdenk/master
+ [Add mapPartitionsWithIndex]
+
+ 560ee5c Thu Sep 26 11:27:34 2013 -0700
+ Merge pull request #7 from wannabeast/memorystore-fixes
+ [some minor fixes to MemoryStore]
+
+ 6566a19 Thu Sep 26 08:01:04 2013 -0700
+ Merge pull request #9 from rxin/limit
+ [Smarter take/limit implementation.]
+
+ 834686b Sun Sep 22 15:06:48 2013 -0700
+ Merge pull request #928 from jerryshao/fairscheduler-refactor
+ [Refactor FairSchedulableBuilder]
+
+ a2ea069 Sat Sep 21 23:04:42 2013 -0700
+ Merge pull request #937 from jerryshao/localProperties-fix
+ [Fix PR926 local properties issues in Spark Streaming like scenarios]
+
+ f06f2da Sat Sep 21 22:43:34 2013 -0700
+ Merge pull request #941 from ilikerps/master
+ [Add "org.apache." prefix to packages in spark-class]
+
+ 7bb12a2 Sat Sep 21 22:42:46 2013 -0700
+ Merge pull request #940 from ankurdave/clear-port-properties-after-tests
+ [After unit tests, clear port properties unconditionally]
+
+ a00317b Fri Sep 20 11:29:31 2013 -0700
+ Merge pull request #1 from ankurdave/aggregateNeighbors-returns-graph
+ [Return Graph from Graph.aggregateNeighbors]
+
+ 6a5e665 Thu Sep 19 22:41:44 2013 -0700
+ Merge pull request #3 from ankurdave/clear-port-properties-after-tests
+ [After unit tests, clear port properties unconditionally ]
+
+ 68ad33a Thu Sep 19 21:30:27 2013 -0700
+ Merge pull request #2 from ankurdave/package-fixes
+ [Package fixes (spark.graph -> org.apache.spark.graph)]
+
+ cd7222c Thu Sep 19 14:21:24 2013 -0700
+ Merge pull request #938 from ilikerps/master
+ [Fix issue with spark_ec2 seeing empty security groups]
+
+ e0dd24d Sat Aug 31 17:54:15 2013 -0700
+ Merge pull request #879 from AndreSchumacher/scala-2.10
+ [PySpark: replacing class manifest by class tag for Scala 2.10.2 in rdd.py]
+
+ ad61349 Thu Jul 18 13:53:48 2013 -0700
+ Merge pull request #709 from ScrapCodes/scala-2.10
+ [Fixed warnings in scala 2.10 branch.]
+
+ a289ded Mon Jul 15 15:59:43 2013 -0700
+ Merge pull request #700 from ScrapCodes/scala-2.10
+ [Scala 2.10 ]
+
+ 1044a95 Fri Jun 14 20:04:24 2013 -0700
+ Merge pull request #652 from ScrapCodes/scala-2.10
+ [Fixed maven build without netty fix]
+
+ 4b57f83 Sat Apr 20 10:40:07 2013 -0700
+ Merge pull request #535 from ScrapCodes/scala-2.10-repl-port
+ [porting of repl to scala-2.10]
+
+ 73b3fee Sun Jan 20 10:11:49 2013 -0800
+ Merge pull request #388 from folone/master
+ [Updated maven build configuration for Scala 2.10]
+
+ 20adf27 Tue Jan 15 11:03:49 2013 -0800
+ Merge pull request #371 from folone/master
+ [Scala 2.10.0]
+
+Release 0.8.0-incubating
+
+ 2aff798 Sun Sep 15 14:05:04 2013 -0700
+ Merge pull request #933 from jey/yarn-typo-fix
+ [Fix typo in Maven build docs]
+
+ dbd2c4f Sun Sep 15 13:20:41 2013 -0700
+ Merge pull request #932 from pwendell/mesos-version
+ [Bumping Mesos version to 0.13.0]
+
+ 9fb0b9d Sun Sep 15 13:02:53 2013 -0700
+ Merge pull request #931 from pwendell/yarn-docs
+ [Explain yarn.version in Maven build docs]
+
+ c4c1db2 Fri Sep 13 19:52:12 2013 -0700
+ Merge pull request #929 from pwendell/master
+ [Use different Hadoop version for YARN artifacts.]
+
+ a310de6 Wed Sep 11 19:36:11 2013 -0700
+ Merge pull request #926 from kayousterhout/dynamic
+ [Changed localProperties to use ThreadLocal (not DynamicVariable).]
+
+ 58c7d8b Wed Sep 11 17:33:42 2013 -0700
+ Merge pull request #927 from benh/mesos-docs
+ [Updated Spark on Mesos documentation.]
+
+ 91a59e6 Wed Sep 11 10:21:48 2013 -0700
+ Merge pull request #919 from mateiz/jets3t
+ [Add explicit jets3t dependency, which is excluded in hadoop-client]
+
+ b9128d3 Wed Sep 11 10:03:06 2013 -0700
+ Merge pull request #922 from pwendell/port-change
+ [Change default port number from 3030 to 4030.]
+
+ e07eef8 Wed Sep 11 07:35:39 2013 -0700
+ Merge pull request #925 from davidmccauley/master
+ [SPARK-894 - Not all WebUI fields delivered VIA JSON]
+
+ 8432f27 Tue Sep 10 23:19:53 2013 -0700
+ Merge pull request #923 from haoyuan/master
+ [fix run-example script]
+
+ d40f140 Tue Sep 10 23:05:29 2013 -0700
+ Merge pull request #921 from pwendell/master
+ [Fix HDFS access bug with assembly build.]
+
+ 0a6c051 Mon Sep 9 23:37:57 2013 -0700
+ Merge pull request #918 from pwendell/branch-0.8
+ [Update versions for 0.8.0 release.]
+
+ 8c14f4b Mon Sep 9 22:07:58 2013 -0700
+ Merge pull request #917 from pwendell/master
+ [Document libgfortran dependency for MLBase]
+
+ c81377b Mon Sep 9 20:16:19 2013 -0700
+ Merge pull request #915 from ooyala/master
+ [Get rid of / improve ugly NPE when Utils.deleteRecursively() fails]
+
+ 61d2a01 Mon Sep 9 18:21:01 2013 -0700
+ Merge pull request #916 from mateiz/mkdist-fix
+ [Fix copy issue in https://github.com/mesos/spark/pull/899]
+
+ a85758c Mon Sep 9 13:45:40 2013 -0700
+ Merge pull request #907 from stephenh/document_coalesce_shuffle
+ [Add better docs for coalesce.]
+
+ 084fc36 Mon Sep 9 12:01:35 2013 -0700
+ Merge pull request #912 from tgravescs/ganglia-pom
+ [Add metrics-ganglia to core pom file]
+
+ 0456384 Mon Sep 9 09:57:54 2013 -0700
+ Merge pull request #911 from pwendell/ganglia-sink
+ [Adding Maven dependency for Ganglia]
+
+ bf984e2 Sun Sep 8 23:50:24 2013 -0700
+ Merge pull request #890 from mridulm/master
+ [Fix hash bug]
+
+ e9d4f44 Sun Sep 8 23:36:48 2013 -0700
+ Merge pull request #909 from mateiz/exec-id-fix
+ [Fix an instance where full standalone mode executor IDs were passed to]
+
+ 2447b1c Sun Sep 8 22:27:49 2013 -0700
+ Merge pull request #910 from mateiz/ml-doc-tweaks
+ [Small tweaks to MLlib docs]
+
+ 7d3204b Sun Sep 8 21:39:12 2013 -0700
+ Merge pull request #905 from mateiz/docs2
+ [Job scheduling and cluster mode docs]
+
+ f1f8371 Sun Sep 8 21:26:11 2013 -0700
+ Merge pull request #896 from atalwalkar/master
+ [updated content]
+
+ f68848d Sun Sep 8 18:32:16 2013 -0700
+ Merge pull request #906 from pwendell/ganglia-sink
+ [Clean-up of Metrics Code/Docs and Add Ganglia Sink]
+
+ 0b95799 Sun Sep 8 15:30:16 2013 -0700
+ Merge pull request #908 from pwendell/master
+ [Fix target JVM version in scala build]
+
+ 04cfb3a Sun Sep 8 10:33:20 2013 -0700
+ Merge pull request #898 from ilikerps/660
+ [SPARK-660: Add StorageLevel support in Python]
+
+ 38488ac Sun Sep 8 00:28:53 2013 -0700
+ Merge pull request #900 from pwendell/cdh-docs
+ [Provide docs to describe running on CDH/HDP cluster.]
+
+ a8e376e Sat Sep 7 21:16:01 2013 -0700
+ Merge pull request #904 from pwendell/master
+ [Adding Apache license to two files]
+
+ cfde85e Sat Sep 7 13:53:08 2013 -0700
+ Merge pull request #901 from ooyala/2013-09/0.8-doc-changes
+ [0.8 Doc changes for make-distribution.sh]
+
+ 4a7813a Sat Sep 7 13:52:24 2013 -0700
+ Merge pull request #903 from rxin/resulttask
+ [Fixed the bug that ResultTask was not properly deserializing outputId.]
+
+ afe46ba Sat Sep 7 07:28:51 2013 -0700
+ Merge pull request #892 from jey/fix-yarn-assembly
+ [YARN build fixes]
+
+ 2eebeff Fri Sep 6 15:25:22 2013 -0700
+ Merge pull request #897 from pwendell/master
+ [Docs describing Spark monitoring and instrumentation]
+
+ ddcb9d3 Thu Sep 5 23:54:09 2013 -0700
+ Merge pull request #895 from ilikerps/821
+ [SPARK-821: Don't cache results when action run locally on driver]
+
+ 699c331 Thu Sep 5 20:21:53 2013 -0700
+ Merge pull request #891 from xiajunluan/SPARK-864
+ [[SPARK-864]DAGScheduler Exception if we delete Worker and StandaloneExecutorBackend then add Worker]
+
+ 5c7494d Wed Sep 4 22:47:03 2013 -0700
+ Merge pull request #893 from ilikerps/master
+ [SPARK-884: Add unit test to validate Spark JSON output]
+
+ a547866 Wed Sep 4 21:11:56 2013 -0700
+ Merge pull request #894 from c0s/master
+ [Updating assembly README to reflect recent changes in the build.]
+
+ 19f7027 Tue Sep 3 14:29:10 2013 -0700
+ Merge pull request #878 from tgravescs/yarnUILink
+ [Link the Spark UI up to the Yarn UI ]
+
+ 68df246 Tue Sep 3 13:01:17 2013 -0700
+ Merge pull request #889 from alig/master
+ [Return the port the WebUI is bound to (useful if port 0 was used)]
+
+ d3dd48f Mon Sep 2 16:44:54 2013 -0700
+ Merge pull request #887 from mateiz/misc-fixes
+ [Miscellaneous fixes for 0.8]
+
+ 636fc0c Mon Sep 2 11:20:39 2013 -0700
+ Merge pull request #886 from mateiz/codec
+ [Fix spark.io.compression.codec and change default codec to LZF]
+
+ d9a53b9 Sun Sep 1 22:12:30 2013 -0700
+ Merge pull request #885 from mateiz/win-py
+ [Allow PySpark to run on Windows]
+
+ 3c520fe Sun Sep 1 17:26:55 2013 -0700
+ Merge pull request #884 from mateiz/win-fixes
+ [Run script fixes for Windows after package & assembly change]
+
+ f957c26 Sun Sep 1 14:53:57 2013 -0700
+ Merge pull request #882 from mateiz/package-rename
+ [Rename spark package to org.apache.spark]
+
+ a30fac1 Sun Sep 1 12:27:50 2013 -0700
+ Merge pull request #883 from alig/master
+ [Don't require the spark home environment variable to be set for standalone mode (change needed by SIMR)]
+
+ 03cc765 Sun Sep 1 10:20:56 2013 -0700
+ Merge pull request #881 from pwendell/master
+ [Extend QuickStart to include next steps]
+
+ 0e9565a Sat Aug 31 18:55:41 2013 -0700
+ Merge pull request #880 from mateiz/ui-tweaks
+ [Various UI tweaks]
+
+ 2b29a1d Sat Aug 31 17:49:45 2013 -0700
+ Merge pull request #877 from mateiz/docs
+ [Doc improvements for 0.8]
+
+ 6edef9c Sat Aug 31 13:39:24 2013 -0700
+ Merge pull request #861 from AndreSchumacher/pyspark_sampling_function
+ [Pyspark sampling function]
+
+ fd89835 Sat Aug 31 13:18:12 2013 -0700
+ Merge pull request #870 from JoshRosen/spark-885
+ [Don't send SIGINT / ctrl-c to Py4J gateway subprocess]
+
+ 618f0ec Fri Aug 30 18:17:13 2013 -0700
+ Merge pull request #869 from AndreSchumacher/subtract
+ [PySpark: implementing subtractByKey(), subtract() and keyBy()]
+
+ 94bb7fd Fri Aug 30 12:05:13 2013 -0700
+ Merge pull request #876 from mbautin/master_hadoop_rdd_conf
+ [Make HadoopRDD's configuration accessible]
+
+ 9e17e45 Fri Aug 30 00:22:53 2013 -0700
+ Merge pull request #875 from shivaram/build-fix
+ [Fix broken build by removing addIntercept]
+
+ 016787d Thu Aug 29 22:15:14 2013 -0700
+ Merge pull request #863 from shivaram/etrain-ridge
+ [Adding linear regression and refactoring Ridge regression to use SGD]
+
+ 852d810 Thu Aug 29 22:13:15 2013 -0700
+ Merge pull request #819 from shivaram/sgd-cleanup
+ [Change SVM to use {0,1} labels]
+
+ ca71620 Thu Aug 29 21:51:14 2013 -0700
+ Merge pull request #857 from mateiz/assembly
+ [Change build and run instructions to use assemblies]
+
+ 1528776 Thu Aug 29 21:30:47 2013 -0700
+ Merge pull request #874 from jerryshao/fix-report-bug
+ [Fix removed block zero size log reporting]
+
+ abdbacf Wed Aug 28 21:11:31 2013 -0700
+ Merge pull request #871 from pwendell/expose-local
+ [Expose `isLocal` in SparkContext.]
+
+ afcade3 Wed Aug 28 20:15:40 2013 -0700
+ Merge pull request #873 from pwendell/master
+ [Hot fix for command runner]
+
+ baa84e7 Wed Aug 28 12:44:46 2013 -0700
+ Merge pull request #865 from tgravescs/fixtmpdir
+ [Spark on Yarn should use yarn approved directories for spark.local.dir and tmp]
+
+ cd043cf Tue Aug 27 19:50:32 2013 -0700
+ Merge pull request #867 from tgravescs/yarnenvconfigs
+ [Spark on Yarn allow users to specify environment variables ]
+
+ 898da7e Mon Aug 26 20:40:49 2013 -0700
+ Merge pull request #859 from ianbuss/sbt_opts
+ [Pass SBT_OPTS environment through to sbt_launcher]
+
+ 17bafea Mon Aug 26 11:59:32 2013 -0700
+ Merge pull request #864 from rxin/json1
+ [Revert json library change]
+
+ f9fc5c1 Sat Aug 24 15:19:56 2013 -0700
+ Merge pull request #603 from pwendell/ec2-updates
+ [Several Improvements to EC2 Scripts]
+
+ d282c1e Fri Aug 23 11:20:20 2013 -0700
+ Merge pull request #860 from jey/sbt-ide-fixes
+ [Fix IDE project generation under SBT]
+
+ 5a6ac12 Thu Aug 22 22:08:03 2013 -0700
+ Merge pull request #701 from ScrapCodes/documentation-suggestions
+ [Documentation suggestions for spark streaming.]
+
+ 46ea0c1 Thu Aug 22 15:57:28 2013 -0700
+ Merge pull request #814 from holdenk/master
+ [Create less instances of the random class during ALS initialization.]
+
+ 9ac3d62 Thu Aug 22 15:51:10 2013 -0700
+ Merge pull request #856 from jey/sbt-fix-hadoop-0.23.9
+ [Re-add removed dependency to fix build under Hadoop 0.23.9]
+
+ ae8ba83 Thu Aug 22 10:14:54 2013 -0700
+ Merge pull request #855 from jey/update-build-docs
+ [Update build docs]
+
+ 8a36fd0 Thu Aug 22 10:13:35 2013 -0700
+ Merge pull request #854 from markhamstra/pomUpdate
+ [Synced sbt and maven builds to use the same dependencies, etc.]
+
+ c2d00f1 Thu Aug 22 10:13:03 2013 -0700
+ Merge pull request #832 from alig/coalesce
+ [Coalesced RDD with locality]
+
+ e6d66c8 Wed Aug 21 17:44:31 2013 -0700
+ Merge pull request #853 from AndreSchumacher/double_rdd
+ [Implementing SPARK-838: Add DoubleRDDFunctions methods to PySpark]
+
+ 2905611 Tue Aug 20 17:36:14 2013 -0700
+ Merge pull request #851 from markhamstra/MutablePairTE
+ [Removed meaningless types]
+
+ d61337f Tue Aug 20 10:06:06 2013 -0700
+ Merge pull request #844 from markhamstra/priorityRename
+ [Renamed 'priority' to 'jobId' and assorted minor changes]
+
+ 8cae72e Mon Aug 19 23:40:04 2013 -0700
+ Merge pull request #828 from mateiz/sched-improvements
+ [Scheduler fixes and improvements]
+
+ efeb142 Mon Aug 19 19:23:50 2013 -0700
+ Merge pull request #849 from mateiz/web-fixes
+ [Small fixes to web UI]
+
+ abdc1f8 Mon Aug 19 18:30:56 2013 -0700
+ Merge pull request #847 from rxin/rdd
+ [Allow subclasses of Product2 in all key-value related classes]
+
+ 8fa0747 Sun Aug 18 17:02:54 2013 -0700
+ Merge pull request #840 from AndreSchumacher/zipegg
+ [Implementing SPARK-878 for PySpark: adding zip and egg files to context ...]
+
+ 1e137a5 Sat Aug 17 22:22:32 2013 -0700
+ Merge pull request #846 from rxin/rdd
+ [Two minor RDD refactoring]
+
+ e89ffc7 Fri Aug 16 14:02:34 2013 -0700
+ Merge pull request #839 from jegonzal/zip_partitions
+ [Currying RDD.zipPartitions ]
+
+ 1fb1b09 Thu Aug 15 22:15:05 2013 -0700
+ Merge pull request #841 from rxin/json
+ [Use the JSON formatter from Scala library and removed dependency on lift-json.]
+
+ c69c489 Thu Aug 15 20:55:09 2013 -0700
+ Merge pull request #843 from Reinvigorate/bug-879
+ [fixing typo in conf/slaves]
+
+ 230ab27 Thu Aug 15 17:45:17 2013 -0700
+ Merge pull request #834 from Daemoen/master
+ [Updated json output to allow for display of worker state]
+
+ 659553b Thu Aug 15 16:56:31 2013 -0700
+ Merge pull request #836 from pwendell/rename
+ [Rename `memoryBytesToString` and `memoryMegabytesToString`]
+
+ 28369ff Thu Aug 15 16:44:02 2013 -0700
+ Merge pull request #829 from JoshRosen/pyspark-unit-tests-python-2.6
+ [Fix PySpark unit tests on Python 2.6]
+
+ 1a13460 Thu Aug 15 15:50:44 2013 -0700
+ Merge pull request #833 from rxin/ui
+ [Various UI improvements.]
+
+ 044a088 Wed Aug 14 20:43:49 2013 -0700
+ Merge pull request #831 from rxin/scheduler
+ [A few small scheduler / job description changes.]
+
+ 839f2d4 Wed Aug 14 16:17:23 2013 -0700
+ Merge pull request #822 from pwendell/ui-features
+ [Adding GC Stats to TaskMetrics (and three small fixes)]
+
+ 63446f9 Wed Aug 14 00:17:07 2013 -0700
+ Merge pull request #826 from kayousterhout/ui_fix
+ [Fixed 2 bugs in executor UI (incl. SPARK-877)]
+
+ 3f14cba Tue Aug 13 20:09:51 2013 -0700
+ Merge pull request #825 from shivaram/maven-repl-fix
+ [Set SPARK_CLASSPATH for maven repl tests]
+
+ 596adc6 Tue Aug 13 19:41:34 2013 -0700
+ Merge pull request #824 from mateiz/mesos-0.12.1
+ [Update to Mesos 0.12.1]
+
+ d316af9 Tue Aug 13 15:31:01 2013 -0700
+ Merge pull request #821 from pwendell/print-launch-command
+ [Print run command to stderr rather than stdout]
+
+ 1f79d21 Tue Aug 13 15:23:54 2013 -0700
+ Merge pull request #818 from kayousterhout/killed_fix
+ [Properly account for killed tasks.]
+
+ 622f83c Tue Aug 13 09:58:52 2013 -0700
+ Merge pull request #817 from pwendell/pr_784
+ [Minor clean-up in metrics servlet code]
+
+ a0133bf Tue Aug 13 09:28:18 2013 -0700
+ Merge pull request #784 from jerryshao/dev-metrics-servlet
+ [Add MetricsServlet for Spark metrics system]
+
+ e2fdac6 Mon Aug 12 21:26:59 2013 -0700
+ Merge pull request #802 from stayhf/SPARK-760-Python
+ [Simple PageRank algorithm implementation in Python for SPARK-760]
+
+ d3525ba Mon Aug 12 21:02:39 2013 -0700
+ Merge pull request #813 from AndreSchumacher/add_files_pyspark
+ [Implementing SPARK-865: Add the equivalent of ADD_JARS to PySpark]
+
+ 9e02da2 Mon Aug 12 20:22:27 2013 -0700
+ Merge pull request #812 from shivaram/maven-mllib-tests
+ [Create SparkContext in beforeAll for MLLib tests]
+
+ 65d0d91 Mon Aug 12 19:00:57 2013 -0700
+ Merge pull request #807 from JoshRosen/guava-optional
+ [Change scala.Option to Guava Optional in Java APIs]
+
+ 4346f0a Mon Aug 12 12:12:12 2013 -0700
+ Merge pull request #809 from shivaram/sgd-cleanup
+ [Clean up scaladoc in ML Lib.]
+
+ ea1b4ba Mon Aug 12 08:09:58 2013 -0700
+ Merge pull request #806 from apivovarov/yarn-205
+ [Changed yarn.version to 2.0.5 in pom.xml]
+
+ 2a39d2c Sun Aug 11 20:35:09 2013 -0700
+ Merge pull request #810 from pwendell/dead_doc_code
+ [Remove now dead code inside of docs]
+
+ e5b9ed2 Sun Aug 11 17:22:47 2013 -0700
+ Merge pull request #808 from pwendell/ui_compressed_bytes
+ [Report compressed bytes read when calculating TaskMetrics]
+
+ 3796486 Sun Aug 11 14:51:47 2013 -0700
+ Merge pull request #805 from woggle/hadoop-rdd-jobconf
+ [Use new Configuration() instead of slower new JobConf() in SerializableWritable]
+
+ ff9ebfa Sun Aug 11 10:52:55 2013 -0700
+ Merge pull request #762 from shivaram/sgd-cleanup
+ [Refactor SGD options into a new class.]
+
+ 95c62ca Sun Aug 11 10:30:52 2013 -0700
+ Merge pull request #804 from apivovarov/master
+ [Fixed path to JavaALS.java and JavaKMeans.java, fixed hadoop2-yarn profi...]
+
+ 06e4f2a Sat Aug 10 18:06:23 2013 -0700
+ Merge pull request #789 from MLnick/master
+ [Adding Scala version of PageRank example]
+
+ 71c63de Sat Aug 10 10:21:20 2013 -0700
+ Merge pull request #795 from mridulm/master
+ [Fix bug reported in PR 791 : a race condition in ConnectionManager and Connection]
+
+ d17eeb9 Sat Aug 10 09:02:27 2013 -0700
+ Merge pull request #785 from anfeng/master
+ [expose HDFS file system stats via Executor metrics]
+
+ dce5e47 Fri Aug 9 21:53:45 2013 -0700
+ Merge pull request #800 from dlyubimov/HBASE_VERSION
+ [Pull HBASE_VERSION in the head of sbt build]
+
+ cd247ba Fri Aug 9 20:41:13 2013 -0700
+ Merge pull request #786 from shivaram/mllib-java
+ [Java fixes, tests and examples for ALS, KMeans]
+
+ b09d4b7 Fri Aug 9 13:17:08 2013 -0700
+ Merge pull request #799 from woggle/sync-fix
+ [Remove extra synchronization in ResultTask]
+
+ 0bc63bf Fri Aug 9 13:16:25 2013 -0700
+ Merge pull request #801 from pwendell/print-launch-command
+ [Print launch command [Branch 0.8 version]]
+
+ cc6b92e Fri Aug 9 13:00:33 2013 -0700
+ Merge pull request #775 from pwendell/print-launch-command
+ [Log the launch command for Spark daemons]
+
+ f94fc75 Fri Aug 9 10:04:03 2013 -0700
+ Merge pull request #788 from shane-huang/sparkjavaopts
+ [For standalone mode, add worker local env setting of SPARK_JAVA_OPTS as ...]
+
+ 63b6e02 Thu Aug 8 14:02:02 2013 -0700
+ Merge pull request #797 from mateiz/chill-0.3.1
+ [Update to Chill 0.3.1]
+
+ 9955e5a Thu Aug 8 11:03:38 2013 -0700
+ Merge pull request #796 from pwendell/bootstrap-design
+ [Bootstrap re-design]
+
+ 5133e4b Wed Aug 7 15:50:45 2013 -0700
+ Merge pull request #790 from kayousterhout/fix_throughput
+ [Fixed issue in UI that decreased scheduler throughput by 5x or more]
+
+ 3c8478e Tue Aug 6 23:25:03 2013 -0700
+ Merge pull request #747 from mateiz/improved-lr
+ [Update the Python logistic regression example]
+
+ 6b043a6 Tue Aug 6 22:31:02 2013 -0700
+ Merge pull request #724 from dlyubimov/SPARK-826
+ [SPARK-826: fold(), reduce(), collect() always attempt to use java serialization]
+
+ de6c4c9 Tue Aug 6 17:09:50 2013 -0700
+ Merge pull request #787 from ash211/master
+ [Update spark-standalone.md]
+
+ df4d10d Tue Aug 6 15:44:05 2013 -0700
+ Merge pull request #779 from adatao/adatao-global-SparkEnv
+ [[HOTFIX] Extend thread safety for SparkEnv.get()]
+
+ d2b0f0c Tue Aug 6 14:49:39 2013 -0700
+ Merge pull request #770 from stayhf/SPARK-760-Java
+ [Simple PageRank algorithm implementation in Java for SPARK-760]
+
+ d031f73 Mon Aug 5 22:33:00 2013 -0700
+ Merge pull request #782 from WANdisco/master
+ [SHARK-94 Log the files computed by HadoopRDD and NewHadoopRDD]
+
+ 1b63dea Mon Aug 5 22:21:26 2013 -0700
+ Merge pull request #769 from markhamstra/NegativeCores
+ [SPARK-847 + SPARK-845: Zombie workers and negative cores]
+
+ 828aff7 Mon Aug 5 21:37:33 2013 -0700
+ Merge pull request #776 from gingsmith/master
+ [adding matrix factorization data generator]
+
+ 8b27789 Mon Aug 5 19:14:52 2013 -0700
+ Merge pull request #774 from pwendell/job-description
+ [Show user-defined job name in UI]
+
+ 550b0cf Mon Aug 5 12:10:32 2013 -0700
+ Merge pull request #780 from cybermaster/master
+ [SPARK-850]
+
+ 22abbc1 Fri Aug 2 16:37:59 2013 -0700
+ Merge pull request #772 from karenfeng/ui-843
+ [Show app duration]
+
+ 9d7dfd2 Thu Aug 1 17:41:58 2013 -0700
+ Merge pull request #743 from pwendell/app-metrics
+ [Add application metrics to standalone master]
+
+ 6d7afd7 Thu Aug 1 17:13:28 2013 -0700
+ Merge pull request #768 from pwendell/pr-695
+ [Minor clean-up of fair scheduler UI]
+
+ 5e7b38f Thu Aug 1 14:59:33 2013 -0700
+ Merge pull request #695 from xiajunluan/pool_ui
+ [Enhance job ui in spark ui system with adding pool information]
+
+ 0a96493 Thu Aug 1 11:27:17 2013 -0700
+ Merge pull request #760 from karenfeng/heading-update
+ [Clean up web UI page headers]
+
+ cb7dd86 Thu Aug 1 11:06:10 2013 -0700
+ Merge pull request #758 from pwendell/master-json
+ [Add JSON path to master index page]
+
+ 58756b7 Wed Jul 31 23:45:41 2013 -0700
+ Merge pull request #761 from mateiz/kmeans-generator
+ [Add data generator for K-means]
+
+ ecab635 Wed Jul 31 18:16:55 2013 -0700
+ Merge pull request #763 from c0s/assembly
+ [SPARK-842. Maven assembly is including examples libs and dependencies]
+
+ 39c75f3 Wed Jul 31 15:52:36 2013 -0700
+ Merge pull request #757 from BlackNiuza/result_task_generation
+ [Bug fix: SPARK-837]
+
+ b2b86c2 Wed Jul 31 15:51:39 2013 -0700
+ Merge pull request #753 from shivaram/glm-refactor
+ [Build changes for ML lib]
+
+ 14bf2fe Wed Jul 31 14:18:16 2013 -0700
+ Merge pull request #749 from benh/spark-executor-uri
+ [Added property 'spark.executor.uri' for launching on Mesos.]
+
+ 4ba4c3f Wed Jul 31 13:14:49 2013 -0700
+ Merge pull request #759 from mateiz/split-fix
+ [Use the Char version of split() instead of the String one in MLUtils]
+
+ a386ced Wed Jul 31 11:22:50 2013 -0700
+ Merge pull request #754 from rxin/compression
+ [Compression codec change]
+
+ 0be071a Wed Jul 31 11:11:59 2013 -0700
+ Merge pull request #756 from cdshines/patch-1
+ [Refactored Vector.apply(length, initializer) replacing excessive code with library method]
+
+ d4556f4 Wed Jul 31 08:48:14 2013 -0700
+ Merge pull request #751 from cdshines/master
+ [Cleaned Partitioner & PythonPartitioner source by taking out non-related logic to Utils]
+
+ 29b8cd3 Tue Jul 30 21:30:33 2013 -0700
+ Merge pull request #755 from jerryshao/add-apache-header
+ [Add Apache license header to metrics system]
+
+ e87de03 Tue Jul 30 15:00:08 2013 -0700
+ Merge pull request #744 from karenfeng/bootstrap-update
+ [Use Bootstrap progress bars in web UI]
+
+ ae57020 Tue Jul 30 14:56:41 2013 -0700
+ Merge pull request #752 from rxin/master
+ [Minor mllib cleanup]
+
+ 8aee118 Tue Jul 30 10:27:54 2013 -0700
+ Merge pull request #748 from atalwalkar/master
+ [made SimpleUpdater consistent with other updaters]
+
+ 468a36c Mon Jul 29 19:44:33 2013 -0700
+ Merge pull request #746 from rxin/cleanup
+ [Internal cleanup]
+
+ 1e1ffb1 Mon Jul 29 19:26:19 2013 -0700
+ Merge pull request #745 from shivaram/loss-update-fix
+ [Remove duplicate loss history in Gradient Descent]
+
+ c99b674 Mon Jul 29 16:32:55 2013 -0700
+ Merge pull request #735 from karenfeng/ui-807
+ [Totals for shuffle data and CPU time]
+
+ fe7298b Mon Jul 29 14:01:00 2013 -0700
+ Merge pull request #741 from pwendell/usability
+ [Fix two small usability issues]
+
+ c34c0f6 Mon Jul 29 13:18:10 2013 -0700
+ Merge pull request #731 from pxinghao/master
+ [Adding SVM and Lasso]
+
+ f3d72ff Fri Jul 26 17:19:27 2013 -0700
+ Merge pull request #739 from markhamstra/toolsPom
+ [Missing tools/pom.xml scalatest dependency]
+
+ cb36677 Fri Jul 26 16:59:30 2013 -0700
+ Merge pull request #738 from harsha2010/pruning
+ [Fix bug in Partition Pruning.]
+
+ f3cf094 Thu Jul 25 14:53:21 2013 -0700
+ Merge pull request #734 from woggle/executor-env2
+ [Get more env vars from driver rather than worker]
+
+ 51c2427 Thu Jul 25 00:03:11 2013 -0700
+ Merge pull request #732 from ryanlecompte/master
+ [Refactor Kryo serializer support to use chill/chill-java]
+
+ 52723b9 Wed Jul 24 14:33:02 2013 -0700
+ Merge pull request #728 from jey/examples-jar-env
+ [Fix setting of SPARK_EXAMPLES_JAR]
+
+ 20338c2 Wed Jul 24 14:32:24 2013 -0700
+ Merge pull request #729 from karenfeng/ui-811
+ [Stage Page updates]
+
+ 5584ebc Wed Jul 24 11:46:46 2013 -0700
+ Merge pull request #675 from c0s/assembly
+ [Building spark assembly for further consumption of the Spark project with a deployed cluster]
+
+ a73f3ee Wed Jul 24 08:59:14 2013 -0700
+ Merge pull request #671 from jerryshao/master
+ [Add metrics system for Spark]
+
+ b011329 Tue Jul 23 22:50:09 2013 -0700
+ Merge pull request #727 from rxin/scheduler
+ [Scheduler code style cleanup.]
+
+ 876125b Tue Jul 23 22:28:21 2013 -0700
+ Merge pull request #726 from rxin/spark-826
+ [SPARK-829: scheduler shouldn't hang if a task contains unserializable objects in its closure]
+
+ 2f1736c Tue Jul 23 15:53:30 2013 -0700
+ Merge pull request #725 from karenfeng/task-start
+ [Creates task start events]
+
+ 5364f64 Tue Jul 23 13:40:34 2013 -0700
+ Merge pull request #723 from rxin/mllib
+ [Made RegressionModel serializable and added unit tests to make sure predict methods would work.]
+
+ f369e0e Tue Jul 23 13:22:27 2013 -0700
+ Merge pull request #720 from ooyala/2013-07/persistent-rdds-api
+ [Add a public method getCachedRdds to SparkContext]
+
+ 401aac8 Mon Jul 22 16:57:16 2013 -0700
+ Merge pull request #719 from karenfeng/ui-808
+ [Creates Executors tab for Jobs UI]
+
+ 8ae1436 Mon Jul 22 16:03:04 2013 -0700
+ Merge pull request #722 from JoshRosen/spark-825
+ [Fix bug: DoubleRDDFunctions.sampleStdev() computed non-sample stdev()]
+
+ 15fb394 Sun Jul 21 10:33:38 2013 -0700
+ Merge pull request #716 from c0s/webui-port
+ [Regression: default webui-port can't be set via command line "--webui-port" anymore]
+
+ c40f0f2 Fri Jul 19 13:33:04 2013 -0700
+ Merge pull request #711 from shivaram/ml-generators
+ [Move ML lib data generator files to util/]
+
+ 413b841 Fri Jul 19 13:31:38 2013 -0700
+ Merge pull request #717 from viirya/dev1
+ [Do not copy local jars given to SparkContext in yarn mode]
+
+ 0d0a47c Thu Jul 18 12:06:37 2013 -0700
+ Merge pull request #710 from shivaram/ml-updates
+ [Updates to LogisticRegression]
+
+ c6235b5 Thu Jul 18 11:43:48 2013 -0700
+ Merge pull request #714 from adatao/master
+ [[BUGFIX] Fix for sbt/sbt script SPARK_HOME setting]
+
+ 009c79e Thu Jul 18 11:41:52 2013 -0700
+ Merge pull request #715 from viirya/dev1
+ [fix a bug in build process that pulls in two versions of ASM.]
+
+ 985a9e3 Wed Jul 17 22:27:19 2013 -0700
+ Merge pull request #712 from stayhf/SPARK-817
+ [Consistently invoke bash with /usr/bin/env bash in scripts to make code ...]
+
+ cad48ed Tue Jul 16 21:41:28 2013 -0700
+ Merge pull request #708 from ScrapCodes/dependencies-upgrade
+ [Dependency upgrade Akka 2.0.3 -> 2.0.5]
+
+ 8a8a8f2 Mon Jul 15 23:09:21 2013 -0700
+ Merge pull request #705 from rxin/errormessages
+ [Throw a more meaningful message when runJob is called to launch tasks on non-existent partitions.]
+
+ ed8415b Mon Jul 15 16:41:04 2013 -0700
+ Merge pull request #703 from karenfeng/ui-802
+ [Link to job UI from standalone deploy cluster web UI]
+
+ e3d3e6f Mon Jul 15 14:59:44 2013 -0700
+ Merge pull request #702 from karenfeng/ui-fixes
+ [Adds app name in HTML page titles on job web UI]
+
+ c7877d5 Sun Jul 14 12:58:13 2013 -0700
+ Merge pull request #689 from BlackNiuza/application_status
+ [Bug fix: SPARK-796]
+
+ 10c0593 Sun Jul 14 11:45:18 2013 -0700
+ Merge pull request #699 from pwendell/ui-env
+ [Add `Environment` tab to SparkUI.]
+
+ 89e8549 Sat Jul 13 16:11:08 2013 -0700
+ Merge pull request #698 from Reinvigorate/sm-deps-change
+ [changing com.google.code.findbugs maven coordinates]
+
+ 77c69ae Fri Jul 12 23:05:21 2013 -0700
+ Merge pull request #697 from pwendell/block-locations
+ [Show block locations in Web UI.]
+
+ 5a7835c Fri Jul 12 20:28:21 2013 -0700
+ Merge pull request #691 from karenfeng/logpaging
+ [Create log pages]
+
+ 71ccca0 Fri Jul 12 20:25:06 2013 -0700
+ Merge pull request #696 from woggle/executor-env
+ [Pass executor env vars (e.g. SPARK_CLASSPATH) to compute-classpath.sh]
+
+ 90fc3f3 Fri Jul 12 20:23:36 2013 -0700
+ Merge pull request #692 from Reinvigorate/takeOrdered
+ [adding takeOrdered() to RDD]
+
+ 018d04c Thu Jul 11 12:48:37 2013 -0700
+ Merge pull request #684 from woggle/mesos-classloader
+ [Explicitly set class loader for MesosSchedulerDriver callbacks.]
+
+ bc19477 Wed Jul 10 22:29:41 2013 -0700
+ Merge pull request #693 from c0s/readme
+ [Updating README to reflect Scala 2.9.3 requirements]
+
+ 7dcda9a Mon Jul 8 23:24:23 2013 -0700
+ Merge pull request #688 from markhamstra/scalaDependencies
+ [Fixed SPARK-795 with explicit dependencies]
+
+ 638927b Mon Jul 8 22:58:50 2013 -0700
+ Merge pull request #683 from shivaram/sbt-test-fix
+ [Remove some stack traces from sbt test output]
+
+ 3c13178 Mon Jul 8 14:50:34 2013 -0700
+ Merge pull request #687 from atalwalkar/master
+ [Added "Labeled" to util functions for labeled data]
+
+ 744da8e Sun Jul 7 17:42:25 2013 -0700
+ Merge pull request #679 from ryanlecompte/master
+ [Make binSearch method tail-recursive for RidgeRegression]
+
+ 3cc6818 Sat Jul 6 19:51:20 2013 -0700
+ Merge pull request #668 from shimingfei/guava-14.0.1
+ [update guava version from 11.0.1 to 14.0.1]
+
+ 2216188 Sat Jul 6 16:18:15 2013 -0700
+ Merge pull request #676 from c0s/asf-avro
+ [Use standard ASF published avro module instead of a proprietary built one]
+
+ 94871e4 Sat Jul 6 15:26:19 2013 -0700
+ Merge pull request #655 from tgravescs/master
+ [Add support for running Spark on Yarn on a secure Hadoop Cluster]
+
+ 3f918b3 Sat Jul 6 12:45:18 2013 -0700
+ Merge pull request #672 from holdenk/master
+ [s/ActorSystemImpl/ExtendedActorSystem/ as ActorSystemImpl results in a warning]
+
+ 2a36e54 Sat Jul 6 12:43:21 2013 -0700
+ Merge pull request #673 from xiajunluan/master
+ [Add config template file for fair scheduler feature]
+
+ 7ba7fa1 Sat Jul 6 11:45:08 2013 -0700
+ Merge pull request #674 from liancheng/master
+ [Bug fix: SPARK-789]
+
+ f4416a1 Sat Jul 6 11:41:58 2013 -0700
+ Merge pull request #681 from BlackNiuza/memory_leak
+ [Remove active job from idToActiveJob when job finished or aborted]
+
+ e063e29 Fri Jul 5 21:54:52 2013 -0700
+ Merge pull request #680 from tdas/master
+ [Fixed major performance bug in Network Receiver]
+
+ bf1311e Fri Jul 5 17:32:44 2013 -0700
+ Merge pull request #678 from mateiz/ml-examples
+ [Start of ML package]
+
+ 6ad85d0 Thu Jul 4 21:32:29 2013 -0700
+ Merge pull request #677 from jerryshao/fix_stage_clean
+ [Clean StageToInfos periodically when spark.cleaner.ttl is enabled]
+
+ 2e32fc8 Thu Jul 4 12:18:20 2013 -0700
+ Merge pull request #666 from c0s/master
+ [hbase dependency is missed in hadoop2-yarn profile of examples module]
+
+ 6d60fe5 Mon Jul 1 18:24:03 2013 -0700
+ Merge pull request #666 from c0s/master
+ [hbase dependency is missed in hadoop2-yarn profile of examples module]
+
+ ccfe953 Sat Jun 29 17:57:53 2013 -0700
+ Merge pull request #577 from skumargithub/master
+ [Example of cumulative counting using updateStateByKey]
+
+ 50ca176 Thu Jun 27 22:24:52 2013 -0700
+ Merge pull request #664 from pwendell/test-fix
+ [Removing incorrect test statement]
+
+ e49bc8c Wed Jun 26 11:13:33 2013 -0700
+ Merge pull request #663 from stephenh/option_and_getenv
+ [Be cute with Option and getenv.]
+
+ f5e32ed Tue Jun 25 09:16:57 2013 -0700
+ Merge pull request #661 from mesos/streaming
+ [Kafka fixes and DStream.count fix for master]
+
+ 1249e91 Mon Jun 24 21:46:33 2013 -0700
+ Merge pull request #572 from Reinvigorate/sm-block-interval
+ [Adding spark.streaming.blockInterval property]
+
+ cfcda95 Mon Jun 24 21:44:50 2013 -0700
+ Merge pull request #571 from Reinvigorate/sm-kafka-serializers
+ [Surfacing decoders on KafkaInputDStream]
+
+ 575aff6 Mon Jun 24 21:35:50 2013 -0700
+ Merge pull request #567 from Reinvigorate/sm-count-fix
+ [Fixing count() in Spark Streaming]
+
+ 3e61bef Sat Jun 22 16:22:47 2013 -0700
+ Merge pull request #648 from shivaram/netty-dbg
+ [Shuffle fixes and cleanup]
+
+ 1ef5d0d Sat Jun 22 09:35:57 2013 -0700
+ Merge pull request #644 from shimingfei/joblogger
+ [add Joblogger to Spark (on new Spark code)]
+
+ 7e4b266 Sat Jun 22 07:53:18 2013 -0700
+ Merge pull request #563 from jey/python-optimization
+ [Optimize PySpark worker invocation]
+
+ 71030ba Wed Jun 19 15:21:03 2013 -0700
+ Merge pull request #654 from lyogavin/enhance_pipe
+ [fix typo and coding style in #638]
+
+ 73f4c7d Tue Jun 18 04:21:17 2013 -0700
+ Merge pull request #605 from esjewett/SPARK-699
+ [Add hBase example (retry of pull request #596)]
+
+ 9933836 Tue Jun 18 02:41:10 2013 -0700
+ Merge pull request #647 from jerryshao/master
+ [Reduce ZippedPartitionsRDD's getPreferredLocations complexity from O(2^2n) to O(2^n)]
+
+ db42451 Mon Jun 17 15:26:36 2013 -0700
+ Merge pull request #643 from adatao/master
+ [Bug fix: Zero-length partitions result in NaN for overall mean & variance]
+
+ e82a2ff Mon Jun 17 15:13:15 2013 -0700
+ Merge pull request #653 from rxin/logging
+ [SPARK-781: Log the temp directory path when Spark says "Failed to create temp directory."]
+
+ e6d1277 Mon Jun 17 12:56:25 2013 -0700
+ Merge pull request #638 from lyogavin/enhance_pipe
+ [Enhance pipe to support more features we can do in hadoop streaming]
+
+ f961aac Sat Jun 15 00:53:41 2013 -0700
+ Merge pull request #649 from ryanlecompte/master
+ [Add top K method to RDD using a bounded priority queue]
+
+ 6602d94 Fri Jun 14 10:41:31 2013 -0700
+ Merge pull request #651 from rxin/groupbykey
+ [SPARK-772 / SPARK-774: groupByKey and cogroup should disable map side combine]
+
+ d93851a Thu Jun 13 13:38:45 2013 -0700
+ Merge pull request #645 from pwendell/compression
+ [Adding compression to Hadoop save functions]
+
+ f1da591 Wed Jun 12 17:55:08 2013 -0700
+ Merge pull request #646 from markhamstra/jvmArgs
+ [Fixed jvmArgs in maven build.]
+
+ 0e94b73 Mon Jun 10 13:00:31 2013 -0700
+ Merge pull request #625 from stephenh/fix-start-slave
+ [Fix start-slave not passing instance number to spark-daemon.]
+
+ 74b91d5 Sat Jun 8 01:19:40 2013 -0700
+ Merge pull request #629 from c0s/master
+ [Sometime Maven build runs out of PermGen space.]
+
+ c8fc423 Fri Jun 7 22:43:18 2013 -0700
+ Merge pull request #631 from jerryshao/master
+ [Fix block manager UI display issue when enable spark.cleaner.ttl]
+
+ 1ae60bc Fri Jun 7 22:39:06 2013 -0700
+ Merge pull request #634 from xiajunluan/master
+ [[Spark-753] Fix ClusterSchedulSuite unit test failed ]
+
+ fff3728 Tue Jun 4 16:09:50 2013 -0700
+ Merge pull request #640 from pwendell/timeout-update
+ [Fixing bug in BlockManager timeout]
+
+ f420d4f Tue Jun 4 15:25:58 2013 -0700
+ Merge pull request #639 from pwendell/timeout-update
+ [Bump akka and blockmanager timeouts to 60 seconds]
+
+ 84530ba Fri May 31 17:06:13 2013 -0700
+ Merge pull request #636 from rxin/unpersist
+ [Unpersist More block manager cleanup.]
+
+ ef77bb7 Thu May 30 14:50:06 2013 -0700
+ Merge pull request #627 from shivaram/master
+ [Netty and shuffle bug fixes]
+
+ 8cb8178 Thu May 30 14:17:44 2013 -0700
+ Merge pull request #628 from shivaram/zero-block-size
+ [Skip fetching zero-sized blocks in NIO.]
+
+ 6ed7139 Wed May 29 10:14:22 2013 -0700
+ Merge pull request #626 from stephenh/remove-add-if-no-port
+ [Remove unused addIfNoPort.]
+
+ 41d230c Tue May 28 23:35:24 2013 -0700
+ Merge pull request #611 from squito/classloader
+ [Use default classloaders for akka & deserializing task results]
+
+ 3db1e17 Mon May 27 21:31:43 2013 -0700
+ Merge pull request #620 from jerryshao/master
+ [Fix CheckpointRDD java.io.FileNotFoundException when calling getPreferredLocations]
+
+ 3d4891d Sat May 25 23:38:05 2013 -0700
+ Merge pull request #621 from JoshRosen/spark-613
+ [Use ec2-metadata in start-slave.sh to detect if running on EC2]
+
+ e8d4b6c Sat May 25 21:09:03 2013 -0700
+ Merge pull request #529 from xiajunluan/master
+ [[SPARK-663]Implement Fair Scheduler in Spark Cluster Scheduler ]
+
+ 9a3c344 Sat May 25 17:53:43 2013 -0700
+ Merge pull request #624 from rxin/master
+ [NonJavaSerializableClass should not be Java serializable...]
+
+ 24e41aa Fri May 24 16:48:52 2013 -0700
+ Merge pull request #623 from rxin/master
+ [Automatically configure Netty port.]
+
+ 69161f9 Fri May 24 14:42:13 2013 -0700
+ Merge pull request #622 from rxin/master
+ [bug fix: Shuffle block iterator is ignoring the shuffle serializer setting.]
+
+ dbbedfc Thu May 23 23:11:06 2013 -0700
+ Merge pull request #616 from jey/maven-netty-exclusion
+ [Exclude old versions of Netty from Maven-based build]
+
+ a2b0a79 Tue May 21 18:16:20 2013 -0700
+ Merge pull request #619 from woggling/adjust-sampling
+ [Use ARRAY_SAMPLE_SIZE constant instead of hard-coded 100.0 in SizeEstimator]
+
+ 66dac44 Tue May 21 11:41:42 2013 -0700
+ Merge pull request #618 from woggling/dead-code-disttest
+ [DistributedSuite: remove dead code]
+
+ 5912cc4 Fri May 17 19:58:40 2013 -0700
+ Merge pull request #610 from JoshRosen/spark-747
+ [Throw exception if TaskResult exceeds Akka frame size]
+
+ 6c27c38 Thu May 16 17:33:56 2013 -0700
+ Merge pull request #615 from rxin/build-fix
+ [Maven build fix & two other small changes]
+
+ 2f576ab Wed May 15 18:06:24 2013 -0700
+ Merge pull request #602 from rxin/shufflemerge
+ [Manual merge & cleanup of Shane's Shuffle Performance Optimization]
+
+ 48c6f46 Wed May 15 10:47:19 2013 -0700
+ Merge pull request #612 from ash211/patch-4
+ [Docs: Mention spark shell's default for MASTER]
+
+ 203d7b7 Wed May 15 00:47:20 2013 -0700
+ Merge pull request #593 from squito/driver_ui_link
+ [Master UI has link to Application UI]
+
+ 016ac86 Mon May 13 21:45:36 2013 -0700
+ Merge pull request #601 from rxin/emptyrdd-master
+ [EmptyRDD (master branch 0.8)]
+
+ 4b354e0 Mon May 13 17:39:19 2013 -0700
+ Merge pull request #589 from mridulm/master
+ [Add support for instance local scheduling]
+
+ 5dbc9b2 Sun May 12 11:03:10 2013 -0700
+ Merge pull request #608 from pwendell/SPARK-738
+ [SPARK-738: Spark should detect and wrap nonserializable exceptions]
+
+ 63e1999 Fri May 10 13:54:03 2013 -0700
+ Merge pull request #606 from markhamstra/foreachPartition_fix
+ [Actually use the cleaned closure in foreachPartition]
+
+ 42bbe89 Wed May 8 22:30:31 2013 -0700
+ Merge pull request #599 from JoshRosen/spark-670
+ [Fix SPARK-670: EC2 'start' command should require -i option.]
+
+ 0f1b7a0 Wed May 8 13:38:50 2013 -0700
+ Merge pull request #596 from esjewett/master
+ [hBase example]
+
+ 7af92f2 Sat May 4 22:29:17 2013 -0700
+ Merge pull request #597 from JoshRosen/webui-fixes
+ [Two minor bug fixes for Spark Web UI]
+
+ c74ce60 Sat May 4 22:26:35 2013 -0700
+ Merge pull request #598 from rxin/blockmanager
+ [Fixed flaky unpersist test in DistributedSuite.]
+
+ 3bf2c86 Fri May 3 18:27:30 2013 -0700
+ Merge pull request #594 from shivaram/master
+ [Add zip partitions to Java API]
+
+ 2484ad7 Fri May 3 17:08:55 2013 -0700
+ Merge pull request #587 from rxin/blockmanager
+ [A set of shuffle map output related changes]
+
+ 6fe9d4e Thu May 2 21:33:56 2013 -0700
+ Merge pull request #592 from woggling/localdir-fix
+ [Don't accept generated local directory names that can't be created]
+
+ 538ee75 Thu May 2 09:01:42 2013 -0700
+ Merge pull request #581 from jerryshao/master
+ [fix [SPARK-740] block manage UI throws exception when enabling Spark Streaming]
+
+ 9abcbcc Wed May 1 22:45:10 2013 -0700
+ Merge pull request #591 from rxin/removerdd
+ [RDD.unpersist: probably the most desired feature of Spark]
+
+ aa8fe1a Tue Apr 30 22:30:18 2013 -0700
+ Merge pull request #586 from mridulm/master
+ [Pull request to address issues Reynold Xin reported]
+
+ f708dda Tue Apr 30 07:51:40 2013 -0700
+ Merge pull request #585 from pwendell/listener-perf
+ [[Fix SPARK-742] Task Metrics should not employ per-record timing by default]
+
+ 68c07ea Sun Apr 28 20:19:33 2013 -0700
+ Merge pull request #582 from shivaram/master
+ [Add zip partitions interface]
+
+ f6ee9a8 Sun Apr 28 15:36:04 2013 -0700
+ Merge pull request #583 from mridulm/master
+ [Fix issues with streaming test cases after yarn branch merge]
+
+ cf54b82 Thu Apr 25 11:45:58 2013 -0700
+ Merge pull request #580 from pwendell/quickstart
+ [SPARK-739 Have quickstart standlone job use README]
+
+ 118a6c7 Wed Apr 24 08:42:30 2013 -0700
+ Merge pull request #575 from mridulm/master
+ [Manual merge of yarn branch to trunk]
+
+ 5d8a71c Tue Apr 16 19:48:02 2013 -0700
+ Merge pull request #570 from jey/increase-codecache-size
+ [Increase ReservedCodeCacheSize for sbt]
+
+ ec5e553 Sun Apr 14 08:20:13 2013 -0700
+ Merge pull request #558 from ash211/patch-jackson-conflict
+ [Don't pull in old versions of Jackson via hadoop-core]
+
+ c1c219e Sun Apr 14 08:11:23 2013 -0700
+ Merge pull request #564 from maspotts/master
+ [Allow latest scala in PATH, with SCALA_HOME as override (instead of vice-versa)]
+
+ 7c10b3e Fri Apr 12 20:55:22 2013 -0700
+ Merge pull request #565 from andyk/master
+ [Update wording of section on RDD operations in quick start guide in docs]
+
+ 077ae0a Thu Apr 11 19:34:14 2013 -0700
+ Merge pull request #561 from ash211/patch-4
+ [Add details when BlockManager heartbeats time out]
+
+ c91ff8d Wed Apr 10 15:08:23 2013 -0700
+ Merge pull request #560 from ash211/patch-3
+ [Typos: cluser -> cluster]
+
+ 7cd83bf Tue Apr 9 22:07:35 2013 -0700
+ Merge pull request #559 from ash211/patch-example-whitespace
+ [Uniform whitespace across scala examples]
+
+ 271a4f3 Tue Apr 9 22:04:52 2013 -0700
+ Merge pull request #555 from holdenk/master
+ [Retry failed ssh commands in the ec2 python script.]
+
+ 8ac9efb Tue Apr 9 13:50:50 2013 -0700
+ Merge pull request #527 from Reinvigorate/sm-kafka-cleanup
+ [KafkaInputDStream fixes and improvements]
+
+ eed54a2 Mon Apr 8 09:44:30 2013 -0700
+ Merge pull request #553 from pwendell/akka-standalone
+ [SPARK-724 - Have Akka logging enabled by default for standalone daemons]
+
+ b362df3 Sun Apr 7 17:17:52 2013 -0700
+ Merge pull request #552 from MLnick/master
+ [Bumping version for Twitter Algebird to latest]
+
+ 4b30190 Sun Apr 7 17:15:10 2013 -0700
+ Merge pull request #554 from andyk/scala2.9.3
+ [Fixes SPARK-723 - Update build to Scala 2.9.3]
+
+ dfe98ca Tue Apr 2 19:24:12 2013 -0700
+ Merge pull request #550 from erikvanoosten/master
+ [corrected Algebird example]
+
+ b5d7830 Tue Apr 2 19:23:45 2013 -0700
+ Merge pull request #551 from jey/python-bugfixes
+ [Python bugfixes]
+
+ 2be2295 Sun Mar 31 18:09:14 2013 -0700
+ Merge pull request #548 from markhamstra/getWritableClass_filter
+ [Fixed broken filter in getWritableClass[T]]
+
+ 9831bc1 Fri Mar 29 22:16:22 2013 -0700
+ Merge pull request #539 from cgrothaus/fix-webui-workdirpath
+ [Bugfix: WorkerWebUI must respect workDirPath from Worker]
+
+ 3cc8ab6 Fri Mar 29 22:14:07 2013 -0700
+ Merge pull request #541 from stephenh/shufflecoalesce
+ [Add a shuffle parameter to coalesce.]
+
+ cad507a Fri Mar 29 22:13:12 2013 -0700
+ Merge pull request #547 from jey/maven-streaming-tests-initialization-fix
+ [Move streaming test initialization into 'before' blocks]
+
+ a98996d Fri Mar 29 22:12:15 2013 -0700
+ Merge pull request #545 from ash211/patch-1
+ [Don't use deprecated Application in example]
+
+ 104c694 Fri Mar 29 22:11:50 2013 -0700
+ Merge pull request #546 from ash211/patch-2
+ [Update tuning.md]
+
+ bc36ee4 Tue Mar 26 15:05:13 2013 -0700
+ Merge pull request #543 from holdenk/master
+ [Re-enable deprecation warnings and fix deprecated warning.]
+
+ b8949ca Sat Mar 23 07:19:34 2013 -0700
+ Merge pull request #505 from stephenh/volatile
+ [Make Executor fields volatile since they're read from the thread pool.]
+
+ fd53f2f Sat Mar 23 07:13:21 2013 -0700
+ Merge pull request #510 from markhamstra/WithThing
+ [mapWith, flatMapWith and filterWith]
+
+ 4c5efcf Wed Mar 20 19:29:23 2013 -0700
+ Merge pull request #532 from andyk/master
+ [SPARK-715: Adds instructions for building with Maven to documentation]
+
+ 3558849 Wed Mar 20 19:27:47 2013 -0700
+ Merge pull request #538 from rxin/cogroup
+ [Added mapSideCombine flag to CoGroupedRDD. Added unit test for CoGroupedRDD.]
+
+ ca4d083 Wed Mar 20 11:22:36 2013 -0700
+ Merge pull request #528 from MLnick/java-examples
+ [[SPARK-707] Adding Java versions of Pi, LogQuery and K-Means examples]
+
+ b812e6b Wed Mar 20 11:21:02 2013 -0700
+ Merge pull request #526 from markhamstra/foldByKey
+ [Add foldByKey]
+
+ 945d1e7 Tue Mar 19 21:59:06 2013 -0700
+ Merge pull request #536 from sasurfer/master
+ [CoalescedRDD for many partitions]
+
+ 1cbbe94 Tue Mar 19 21:34:34 2013 -0700
+ Merge pull request #534 from stephenh/removetrycatch
+ [Remove try/catch block that can't be hit.]
+
+ 71e53f8 Tue Mar 19 21:31:41 2013 -0700
+ Merge pull request #537 from wishbear/configurableInputFormat
+ [call setConf from input format if it is Configurable]
+
+ c1e9cdc Sat Mar 16 11:47:45 2013 -0700
+ Merge pull request #525 from stephenh/subtractByKey
+ [Add PairRDDFunctions.subtractByKey.]
+
+ cdbfd1e Fri Mar 15 15:13:28 2013 -0700
+ Merge pull request #516 from squito/fix_local_metrics
+ [Fix local metrics]
+
+ f9fa2ad Fri Mar 15 15:12:43 2013 -0700
+ Merge pull request #530 from mbautin/master-update-log4j-and-make-compile-in-IntelliJ
+ [Add a log4j compile dependency to fix build in IntelliJ]
+
+ 4032beb Wed Mar 13 19:29:46 2013 -0700
+ Merge pull request #521 from stephenh/earlyclose
+ [Close the reader in HadoopRDD as soon as iteration end.]
+
+ 3c97276 Wed Mar 13 19:25:08 2013 -0700
+ Merge pull request #524 from andyk/master
+ [Fix broken link to YARN documentation]
+
+ 1c3d981 Wed Mar 13 19:23:48 2013 -0700
+ Merge pull request #517 from Reinvigorate/sm-build-fixes
+ [Build fixes for streaming /w SBT]
+
+ 2d477fd Wed Mar 13 06:49:16 2013 -0700
+ Merge pull request #523 from andyk/master
+ [Fix broken link in Quick Start]
+
+ 00c4d23 Tue Mar 12 22:19:00 2013 -0700
+ Merge pull request #518 from woggling/long-bm-sizes
+ [Send block sizes as longs in BlockManager updates]
+
+ cbf8f0d Mon Mar 11 00:23:57 2013 -0700
+ Merge pull request #513 from MLnick/bagel-caching
+ [Adds choice of persistence level to Bagel.]
+
+ 91a9d09 Sun Mar 10 15:48:23 2013 -0700
+ Merge pull request #512 from patelh/fix-kryo-serializer
+ [Fix reference bug in Kryo serializer, add test, update version]
+
+ 557cfd0 Sun Mar 10 15:44:57 2013 -0700
+ Merge pull request #515 from woggling/deploy-app-death
+ [Notify standalone deploy client of application death.]
+
+ 04fb81f Sun Mar 3 17:20:07 2013 -0800
+ Merge pull request #506 from rxin/spark-706
+ [Fixed SPARK-706: Failures in block manager put leads to read task hanging.]
+
+ 6cf4be4 Sun Mar 3 17:16:22 2013 -0800
+ Merge pull request #462 from squito/stageInfo
+ [Track assorted metrics for each task, report summaries to user at stage completion]
+
+ 6bfc7ca Sat Mar 2 22:14:49 2013 -0800
+ Merge pull request #504 from mosharaf/master
+ [Worker address was getting removed when removing an app.]
+
+ 94b3db1 Sat Mar 2 22:13:52 2013 -0800
+ Merge pull request #508 from markhamstra/TestServerInUse
+ [Avoid bind failure in InputStreamsSuite]
+
+ 25c71d3 Fri Mar 1 08:00:18 2013 -0800
+ Merge pull request #507 from markhamstra/poms271
+ [bump version to 0.7.1-SNAPSHOT in the subproject poms]
+
diff --git a/dev/create-release/generate-changelist.py b/dev/create-release/generate-changelist.py
index 2e1a35a629..916ec90f05 100755
--- a/dev/create-release/generate-changelist.py
+++ b/dev/create-release/generate-changelist.py
@@ -31,8 +31,8 @@ import time
import traceback
SPARK_HOME = os.environ["SPARK_HOME"]
-NEW_RELEASE_VERSION = "1.0.0"
-PREV_RELEASE_GIT_TAG = "v0.9.1"
+NEW_RELEASE_VERSION = "1.1.0"
+PREV_RELEASE_GIT_TAG = "v1.0.0"
CHANGELIST = "CHANGES.txt"
OLD_CHANGELIST = "%s.old" % (CHANGELIST)