Skip to content

Commit 4ec985e

Browse files
author
sungjin.712
committed
change name
1 parent 503ee73 commit 4ec985e

10 files changed: 36 additions (+36) and 4 deletions (-4).
File renamed without changes.
File renamed without changes.

7.PRETRAIN_METHOD/7.2.bert_finetune-KOR_NSMC.ipynb renamed to 7.PRETRAIN_METHOD/7.2.bert_finetune-NSMC.ipynb

Lines changed: 35 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -48,7 +48,7 @@
4848
"tf.random.set_seed(1234)\n",
4949
"np.random.seed(1234)\n",
5050
"\n",
51-
"BATCH_SIZE = 256\n",
51+
"BATCH_SIZE = 32\n",
5252
"NUM_EPOCHS = 3\n",
5353
"VALID_SPLIT = 0.2\n",
5454
"MAX_LEN = 39 # EDA에서 추출된 Max Length\n",
@@ -58,7 +58,7 @@
5858
},
5959
{
6060
"cell_type": "code",
61-
"execution_count": 5,
61+
"execution_count": 4,
6262
"metadata": {},
6363
"outputs": [],
6464
"source": [
@@ -74,7 +74,7 @@
7474
},
7575
{
7676
"cell_type": "code",
77-
"execution_count": 6,
77+
"execution_count": 5,
7878
"metadata": {},
7979
"outputs": [
8080
{
@@ -96,6 +96,38 @@
9696
"print(token_print)"
9797
]
9898
},
99+
{
100+
"cell_type": "code",
101+
"execution_count": 7,
102+
"metadata": {},
103+
"outputs": [
104+
{
105+
"name": "stdout",
106+
"output_type": "stream",
107+
"text": [
108+
"[101, 9521, 118741, 35506, 24982, 48549, 117, 9321, 118610, 119081, 48345, 102]\n",
109+
"[101, 31178, 11356, 102]\n",
110+
"[CLS] 안녕하세요, 반갑습니다 [SEP]\n",
111+
"[CLS] Hello world [SEP]\n"
112+
]
113+
}
114+
],
115+
"source": [
116+
"kor_encode = tokenizer.encode(\"안녕하세요, 반갑습니다\")\n",
117+
"eng_encode = tokenizer.encode(\"Hello world\")\n",
118+
"kor_decode = tokenizer.decode(kor_encode)\n",
119+
"eng_decode = tokenizer.decode(eng_encode)\n",
120+
"\n",
121+
"print(kor_encode)\n",
122+
"# [101, 9521, 118741, 35506, 24982, 48549, 117, 9321, 118610, 119081, 48345, 102]\n",
123+
"print(eng_encode)\n",
124+
"# [101, 31178, 11356, 102]\n",
125+
"print(kor_decode)\n",
126+
"# [CLS] 안녕하세요, 반갑습니다 [SEP]\n",
127+
"print(eng_decode)\n",
128+
"# [CLS] Hello world [SEP]"
129+
]
130+
},
99131
{
100132
"cell_type": "markdown",
101133
"metadata": {},

7.PRETRAIN_METHOD/7.2_bert_finetune-KorNER.ipynb renamed to 7.PRETRAIN_METHOD/7.2_bert_finetune-NER.ipynb

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -52,7 +52,7 @@
5252
"tf.random.set_seed(1234)\n",
5353
"np.random.seed(1234)\n",
5454
"\n",
55-
"BATCH_SIZE = 2\n",
55+
"BATCH_SIZE = 32\n",
5656
"NUM_EPOCHS = 3\n",
5757
"MAX_LEN = 111 # EDA에서 추출된 Max Length\n",
5858
"DATA_IN_PATH = 'data_in/KOR'\n",

0 commit comments

Comments
 (0)