Я пишу функцию для сравнения сходства двух строк, используя универсальный кодировщик предложений Google . Следуя инструкциям в записной книжке здесь У меня в классе есть следующий метод, который принимает два предложения и выводит сходство между ними.
def tf_sim(self, text1, text2):
# Reduce logging output.
tf.logging.set_verbosity(tf.logging.ERROR)
sim_input1 = tf.placeholder(tf.string, shape=(None), name="sim_input1")
sim_input2 = tf.placeholder(tf.string, shape=(None), name="sim_input2")
embedding1 = self.embed([sim_input1])
embedding2 = self.embed([sim_input2])
encode1 = tf.nn.l2_normalize(embedding1, axis=1)
encode2 = tf.nn.l2_normalize(embedding2, axis=1)
sim_scores = -tf.acos(tf.reduce_sum(tf.multiply(encode1, encode2), axis=1))
init_vars = tf.global_variables_initializer()
init_tables = tf.tables_initializer()
with tf.Session() as sess:
sess.run([init_vars, init_tables])
sess.run(sim_scores, feed_dict={sim_input1: text1, sim_input2: text2})
print (sim_scores.eval())
Для справки атрибут self.embed выглядит так:
self.embed = hub.Module("https://tfhub.dev/google/universal-sentence-encoder/2")
Когда я вызываю функцию:
str1 = "Is Python a better first language to learn than Java"
str2 = "Which of Python or Java is a better programming language to
start out with"
tf_sim(str1, str2)
Я получаю следующую трассировку стека:
Traceback (most recent call last):
File "SimilarityCalculator.py", line 143, in <module>
sc.tf_sim(str1, str2)
File "SimilarityCalculator.py", line 67, in tf_sim
print (sim_scores.eval())
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/framework/ops.py", line 710, in eval
return _eval_using_default_session(self, feed_dict, self.graph, session)
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/framework/ops.py", line 5180, in _eval_using_default_session
return session.run(tensors, feed_dict)
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/client/session.py", line 900, in run
run_metadata_ptr)
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/client/session.py", line 1135, in _run
feed_dict_tensor, options, run_metadata)
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/client/session.py", line 1316, in _do_run
run_metadata)
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/client/session.py", line 1335, in _do_call
raise type(e)(node_def, op, message)
tensorflow.python.framework.errors_impl.InvalidArgumentError: You must feed a value for placeholder tensor 'sim_input1' with dtype string
[[Node: sim_input1 = Placeholder[dtype=DT_STRING, shape=<unknown>, _device="/job:localhost/replica:0/task:0/device:CPU:0"]()]]
Caused by op 'sim_input1', defined at:
File "SimilarityCalculator.py", line 143, in <module>
sc.tf_sim(str1, str2)
File "SimilarityCalculator.py", line 40, in tf_sim
sim_input1 = tf.placeholder(tf.string, shape=(None), name="sim_input1")
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/ops/array_ops.py", line 1808, in placeholder
return gen_array_ops.placeholder(dtype=dtype, shape=shape, name=name)
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/ops/gen_array_ops.py", line 4848, in placeholder
"Placeholder", dtype=dtype, shape=shape, name=name)
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/framework/op_def_library.py", line 787, in _apply_op_helper
op_def=op_def)
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/framework/ops.py", line 3392, in create_op
op_def=op_def)
File "/Users/kaushik.visvanathan/anaconda3/envs/Community/lib/python3.6/site-packages/tensorflow/python/framework/ops.py", line 1718, in __init__
self._traceback = self._graph._extract_stack() # pylint: disable=protected-access
InvalidArgumentError (see above for traceback): You must feed a value for placeholder tensor 'sim_input1' with dtype string
[[Node: sim_input1 = Placeholder[dtype=DT_STRING, shape=<unknown>, _device="/job:localhost/replica:0/task:0/device:CPU:0"]()]]
В сущности, мне нужно передать строку заполнителю, хотя, похоже, я это делаю. Я что-то пропустил? Любая помощь с благодарностью!