From f74d0d9ce6b3d4cdd6e99b8e84735ef0cd7406a4 Mon Sep 17 00:00:00 2001
From: YPBlib
Date: Wed, 11 Jul 2018 12:37:49 +0800
Subject: [PATCH 1/2] first commit

---
 README.md | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index 7ea282b..81b39f0 100644
--- a/README.md
+++ b/README.md
@@ -116,6 +116,8 @@ python train_wc.py --train_file ./data/np/train.txt.iobes --dev_file ./data/np/t
 
 For other datasets or tasks, you may wanna try different stopping parameters, especially, for smaller dataset, you may want to set ```least_iters``` to a larger value; and for some tasks, if the speed of loss decreasing is too slow, you may want to increase ```lr```.
 
+
+
 ## Benchmarks
 
 Here we compare LM-LSTM-CRF with recent state-of-the-art models on the CoNLL 2000 Chunking dataset, the CoNLL 2003 NER dataset, and the WSJ portion of the PTB POS Tagging dataset. All experiments are conducted on a GTX 1080 GPU.
@@ -150,8 +152,8 @@ We released pre-trained models on these three tasks. The checkpoint file can be
 
 | WSJ-PTB POS Tagging | CoNLL03 NER |
 | ------------------- |
-| [Args](https://drive.google.com/a/illinois.edu/file/d/0B587SdKqutQmN1UwNjhHQkhUWEk/view?usp=sharing) | [Args](https://drive.google.com/file/d/1tGAQ0hu9AsIBdrqFn5fmDQ72Pk1I-o74/view?usp=sharing) |
-| [Model](https://drive.google.com/a/illinois.edu/file/d/0B587SdKqutQmSDlJRGRNandhMGs/view?usp=sharing) | [Model](https://drive.google.com/file/d/1o9kjZV5EcHAhys3GPgl7EPGE5fuXyYjr/view?usp=sharing) |
+| [Args](https://drive.google.com/a/illinois.edu/file/d/0B587SdKqutQmN1UwNjhHQkhUWEk/view?usp=sharing) | [Args](https://drive.google.com/file/d/1tGAQ0hu9AsIBdrqFn5fmDQ72Pk1I-o74/view?usp=sharing) |
+| [Model](https://drive.google.com/a/illinois.edu/file/d/0B587SdKqutQmSDlJRGRNandhMGs/view?usp=sharing) | [Model](https://drive.google.com/file/d/1o9kjZV5EcHAhys3GPgl7EPGE5fuXyYjr/view?usp=sharing) |
 
 Also, ```eval_wc.py``` is provided to load and run these checkpoints. Its usage can be accessed by command ````python eval_wc.py -h````, and a running command example is provided below:
 ```

From d396510fb5a294711a41727aac11346829303887 Mon Sep 17 00:00:00 2001
From: YPBlib
Date: Fri, 13 Jul 2018 06:43:03 +0800
Subject: [PATCH 2/2] emmm

---
 model/utils.py | 4 +++-
 train_w.py | 17 ++++++++++-------
 2 files changed, 13 insertions(+), 8 deletions(-)

diff --git a/model/utils.py b/model/utils.py
index 05018e9..8599ad6 100644
--- a/model/utils.py
+++ b/model/utils.py
@@ -5,6 +5,8 @@
 .. moduleauthor:: Liyuan Liu, Frank Xu
 """
+
+
 
 import codecs
 import csv
 import itertools
@@ -419,7 +421,7 @@ def load_embedding_wlm(emb_file, delimiter, feature_map, full_feature_set, casel
     outdoc_embedding_array = list()
     outdoc_word_array = list()
 
-    for line in open(emb_file, 'r'):
+    for line in codecs.open(emb_file, 'r','utf-8'):
         line = line.split(delimiter)
         vector = list(map(lambda t: float(t), filter(lambda n: n and not n.isspace(), line[1:])))
 
diff --git a/train_w.py b/train_w.py
index 4779abf..146ffc6 100644
--- a/train_w.py
+++ b/train_w.py
@@ -22,10 +22,10 @@
 if __name__ == "__main__":
     parser = argparse.ArgumentParser(description='Learning with BLSTM-CRF')
     parser.add_argument('--rand_embedding', action='store_true', help='random initialize word embedding')
-    parser.add_argument('--emb_file', default='./embedding/glove.6B.100d.txt', help='path to pre-trained embedding')
-    parser.add_argument('--train_file', default='./data/ner2003/eng.train.iobes', help='path to training file')
-    parser.add_argument('--dev_file', default='./data/ner2003/eng.testa.iobes', help='path to development file')
-    parser.add_argument('--test_file', default='./data/ner2003/eng.testb.iobes', help='path to test file')
+    parser.add_argument('--emb_file', default='./data/glove.6B.100d.txt', help='path to pre-trained embedding')
+    parser.add_argument('--train_file', default='./data/ner2003/eng.train', help='path to training file')
+    parser.add_argument('--dev_file', default='./data/ner2003/eng.testa', help='path to development file')
+    parser.add_argument('--test_file', default='./data/ner2003/eng.testb', help='path to test file')
     parser.add_argument('--gpu', type=int, default=0, help='gpu id, set to -1 if use cpu mode')
     parser.add_argument('--batch_size', type=int, default=10, help='batch size (10)')
    parser.add_argument('--unk', default='unk', help='unknow-token in pre-trained embedding')
@@ -56,8 +56,8 @@
     if args.gpu >= 0:
         torch.cuda.set_device(args.gpu)
 
-    print('setting:')
-    print(args)
+    # print('setting:')
+    # print(args)
 
     # load corpus
     print('loading corpus')
@@ -180,7 +180,10 @@
                 itertools.chain.from_iterable(dataset_loader), mininterval=2,
                 desc=' - Tot it %d (epoch %d)' % (tot_length, args.start_epoch),
                 leave=False, file=sys.stdout):
-            fea_v, tg_v, mask_v = packer.repack_vb(feature, tg, mask)
+            #fea_v, tg_v, mask_v = packer.repack_vb(feature, tg, mask)
+            fea_v, tg_v, mask_v = packer.repack_vb(feature.type(torch.FloatTensor), tg.type(torch.FloatTensor),
+                                                   mask.type(torch.FloatTensor))
+
             ner_model.zero_grad()
             scores, hidden = ner_model.forward(fea_v)
             loss = crit.forward(scores, tg_v, mask_v)
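
The second commit switches the embedding reader in ```load_embedding_wlm``` from the built-in ```open``` to ```codecs.open(emb_file, 'r', 'utf-8')```, so the GloVe file is decoded as UTF-8 regardless of the system locale. A minimal, self-contained sketch of that reading pattern follows; it assumes a whitespace-delimited GloVe-style text file, and the helper name and path below are placeholders rather than code from the repository:

```python
import codecs

def read_glove_vectors(emb_file, delimiter=' '):
    """Read a GloVe-style text embedding file, decoding it explicitly as UTF-8."""
    word_to_vec = {}
    # codecs.open decodes each line as UTF-8, avoiding locale-dependent
    # UnicodeDecodeError on non-ASCII tokens in the vocabulary.
    with codecs.open(emb_file, 'r', 'utf-8') as f:
        for line in f:
            parts = line.rstrip().split(delimiter)
            if len(parts) < 2:
                continue  # skip blank or malformed lines
            word = parts[0]
            vector = [float(t) for t in parts[1:] if t and not t.isspace()]
            word_to_vec[word] = vector
    return word_to_vec

# Hypothetical usage; the path is a placeholder:
# vectors = read_glove_vectors('./data/glove.6B.100d.txt')
```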