@@ -7,8 +7,9 @@
 
 
 class Word2Vec:
-    def __init__(self, batch_size=128, num_skips=2, skip_window=1, vocab_size=constant.VOCAB_SIZE, embed_size=50,
+    def __init__(self, output, batch_size=128, num_skips=2, skip_window=1, vocab_size=constant.VOCAB_SIZE, embed_size=50,
                  num_sampled=64, steps=100000):
+        self.output = output
         self.batch_size = batch_size
         self.num_skips = num_skips
         self.skip_window = skip_window
@@ -51,9 +52,9 @@ def train(self):
                     # The average loss is an estimate of the loss over the last 2000 batches.
                     print("Average loss at step ", step, ": ", aver_loss)
                     aver_loss = 0
-            np.save('tmp/embed', self.embeddings.eval())
-            #self.test(sess)
-    def test(self, sess):
+            np.save(self.output, self.embeddings.eval())
+
+    def test(self):
         valid_dataset = [3021]
         norm = tf.sqrt(tf.reduce_sum(tf.square(self.embeddings), 1, keep_dims=True))
         normalized_embeddings = self.embeddings / norm
@@ -62,10 +63,11 @@ def test(self, sess):
         similarity = tf.abs(tf.matmul(
             valid_embeddings, normalized_embeddings, transpose_b=True))
         print(similarity.eval())
-        pair = zip(range(self.vocab_size),similarity.eval()[0])
+        pair = zip(range(self.vocab_size), similarity.eval()[0])
         spair = sorted(pair, key=lambda x: x[1])
         print(spair[0:10])
 
+
 if __name__ == '__main__':
-    w2v = Word2Vec()
-    w2v.train()
+    w2v = Word2Vec('corpus/lstm/embeddings', embed_size=100)
+    w2v.train()
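
For reference, a minimal sketch of reading the saved matrix back and ranking neighbors, assuming the run above wrote corpus/lstm/embeddings.npy (np.save appends the .npy suffix to the given path) and reusing the probe id 3021 from test(). Note that test() sorts ascending and prints the ten lowest-scoring pairs; the sketch takes the largest |cosine| values instead, the conventional nearest-neighbor ordering.

# Minimal NumPy sketch: load the saved embeddings and rank nearest neighbors.
# Assumes the training run above wrote 'corpus/lstm/embeddings.npy'.
import numpy as np

embeddings = np.load('corpus/lstm/embeddings.npy')        # shape: (vocab_size, embed_size)
norm = np.sqrt(np.sum(np.square(embeddings), axis=1, keepdims=True))
normalized = embeddings / norm                            # unit-length rows

query_id = 3021                                           # same probe id as in test()
similarity = np.abs(normalized[query_id] @ normalized.T)  # |cosine| against every word
nearest = np.argsort(-similarity)[:10]                    # ids of the ten most similar words
print(list(zip(nearest, similarity[nearest])))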