{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "

\n", "# **자연어와 Deep Learning**\n", "## **LSTM 단어 알파벳 완성모델**\n", "\n", "

\n", "## **1 데이터 정의**" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "import tensorflow as tf\n", "import numpy as np\n", "char_arr = ['a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', \n", " 'n', 'o', 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z']\n", "num_dic = {n: i for i, n in enumerate(char_arr)}\n", "dic_len = len(num_dic)" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "def make_batch(seq_data):\n", " input_batch, target_batch = [], []\n", " for seq in seq_data: \n", " input_num = [num_dic[n] for n in seq[:-1]] \n", " target = num_dic[seq[-1]] \n", " input_batch.append(np.eye(dic_len)[input_num])\n", " target_batch.append(target) \n", " return input_batch, target_batch" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "

\n", "## **2 모델의 정의**" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "tf.reset_default_graph()\n", "learning_rate = 0.01\n", "n_step = 3 \n", "n_hidden, total_epoch = 64, 30\n", "n_input = n_class = dic_len" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "X = tf.placeholder(tf.float32, [None, n_step, n_input])\n", "Y = tf.placeholder(tf.int32, [None])\n", "\n", "W = tf.Variable(tf.random_normal([n_hidden, n_class])) \n", "b = tf.Variable(tf.random_normal([n_class]))" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "cell1 = tf.nn.rnn_cell.BasicLSTMCell(n_hidden)\n", "cell1 = tf.nn.rnn_cell.DropoutWrapper(cell1, output_keep_prob=0.5) \n", "cell2 = tf.nn.rnn_cell.BasicLSTMCell(n_hidden) \n", "multi_cell = tf.nn.rnn_cell.MultiRNNCell([cell1, cell2])" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "outputs, states = tf.nn.dynamic_rnn(multi_cell, X, dtype=tf.float32)\n", "outputs = tf.transpose(outputs, [1, 0, 2])\n", "outputs = outputs[-1]\n", "model = tf.matmul(outputs, W) + b" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "cost = tf.reduce_mean(tf.nn.sparse_softmax_cross_entropy_with_logits(\n", " logits = model, labels = Y))\n", "optimizer = tf.train.AdamOptimizer(learning_rate).minimize(cost)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "

\n", "## **3 모델의 학습**" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "%%time\n", "seq_data = ['word', 'wood', 'deep', 'dive', 'cold', 'cool', 'load', 'love', 'kiss', 'kind']\n", "\n", "sess = tf.Session()\n", "sess.run(tf.global_variables_initializer())\n", "input_batch, target_batch = make_batch(seq_data)\n", "for epoch in range(total_epoch):\n", " _, loss = sess.run([optimizer, cost],\n", " feed_dict={X: input_batch, Y: target_batch})\n", " if epoch % 4 == 0:\n", " print('Epoch: {:.4f} cost = {:.6f}'.format(epoch + 1, loss))\n", "print('최적화 완료!')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "

\n", "## **4 학습 모델의 평가**" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "%%time\n", "prediction = tf.cast(tf.argmax(model, 1), tf.int32)\n", "prediction_check = tf.equal(prediction, Y) \n", "accuracy = tf.reduce_mean(tf.cast(prediction_check, tf.float32))\n", "\n", "input_batch, target_batch = make_batch(seq_data)\n", "predict, accuracy_val = sess.run([prediction, accuracy],\n", " feed_dict={X: input_batch, Y: target_batch})" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "predict_words = []\n", "for idx, val in enumerate(seq_data):\n", " last_char = char_arr[predict[idx]]\n", " predict_words.append(val[:3] + last_char)\n", "\n", "print('\\n=== 예측 결과 ===')\n", "print('입력값:', [w[:-1] + ' ' for w in seq_data])\n", "print('예측값:', predict_words)\n", "print('정확도:', accuracy_val)\n", "sess.close()" ] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.3" } }, "nbformat": 4, "nbformat_minor": 2 }