Skip to content

Commit

Permalink
Merge branch 'SPARK-4586' of github.com:mengxr/spark into ml
Browse files Browse the repository at this point in the history
  • Loading branch information
Davies Liu committed Jan 28, 2015
2 parents 1dca16a + fc59a02 commit 78638df
Showing 1 changed file with 4 additions and 2 deletions.
6 changes: 4 additions & 2 deletions python/pyspark/ml/feature.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,8 @@
@inherit_doc
class Tokenizer(JavaTransformer, HasInputCol, HasOutputCol):
"""
- A tokenizer that converts the input string to lowercase and then splits it by white spaces.
+ A tokenizer that converts the input string to lowercase and then
+ splits it by white spaces.
>>> from pyspark.sql import Row
>>> dataset = sqlCtx.inferSchema(sc.parallelize([Row(text="a b c")]))
Expand All @@ -44,7 +45,8 @@ class Tokenizer(JavaTransformer, HasInputCol, HasOutputCol):
@inherit_doc
class HashingTF(JavaTransformer, HasInputCol, HasOutputCol, HasNumFeatures):
"""
- Maps a sequence of terms to their term frequencies using the hashing trick.
+ Maps a sequence of terms to their term frequencies using the
+ hashing trick.
>>> from pyspark.sql import Row
>>> dataset = sqlCtx.inferSchema(sc.parallelize([Row(words=["a", "b", "c"])]))
Expand Down

0 comments on commit 78638df

Please sign in to comment.