From e3d501c66d209716d2fcc97c993116df9abd35c7 Mon Sep 17 00:00:00 2001 From: Aneesh Panoli Date: Sun, 26 Apr 2020 16:05:53 -0700 Subject: [PATCH] scan_vocab is deprecated --- docs/notebooks/doc2vec-wikipedia.ipynb | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/notebooks/doc2vec-wikipedia.ipynb b/docs/notebooks/doc2vec-wikipedia.ipynb index ff4786d3fd..a645ec8ec1 100644 --- a/docs/notebooks/doc2vec-wikipedia.ipynb +++ b/docs/notebooks/doc2vec-wikipedia.ipynb @@ -90,7 +90,7 @@ " self.wiki.metadata = True\n", " def __iter__(self):\n", " for content, (page_id, title) in self.wiki.get_texts():\n", - " yield TaggedDocument([c.decode(\"utf-8\") for c in content], [title])" + " yield TaggedDocument(content, [title]) # python3" ] }, { @@ -121,7 +121,7 @@ "outputs": [], "source": [ "pre = Doc2Vec(min_count=0)\n", - "pre.scan_vocab(documents)" + "pre.build_vocab(documents)" ] }, {