wangzhen38
diff --git a/‎doc/pre_train_model.md
+20-2 b/‎doc/pre_train_model.md
+20-2
diff --git a/‎doc/yaml.md
+2 b/‎doc/yaml.md
+2
diff --git a/‎models/contentunderstanding/readme.md
+6-6 b/‎models/contentunderstanding/readme.md
+6-6
diff --git a/‎models/contentunderstanding/classification/__init__.py ‎models/contentunderstanding/textcnn/__init__.py b/‎models/contentunderstanding/classification/__init__.py ‎models/contentunderstanding/textcnn/__init__.py
diff --git a/‎models/contentunderstanding/classification/config.yaml ‎models/contentunderstanding/textcnn/config.yaml
+1-1 b/‎models/contentunderstanding/classification/config.yaml ‎models/contentunderstanding/textcnn/config.yaml
+1-1
diff --git a/‎models/contentunderstanding/classification/data/preprocess.py ‎models/contentunderstanding/textcnn/data/preprocess.py b/‎models/contentunderstanding/classification/data/preprocess.py ‎models/contentunderstanding/textcnn/data/preprocess.py
diff --git a/‎models/contentunderstanding/classification/data/test/test.txt ‎models/contentunderstanding/textcnn/data/test/test.txt b/‎models/contentunderstanding/classification/data/test/test.txt ‎models/contentunderstanding/textcnn/data/test/test.txt
diff --git a/‎models/contentunderstanding/classification/data/train/train.txt ‎models/contentunderstanding/textcnn/data/train/train.txt b/‎models/contentunderstanding/classification/data/train/train.txt ‎models/contentunderstanding/textcnn/data/train/train.txt
diff --git a/‎models/contentunderstanding/classification/model.py ‎models/contentunderstanding/textcnn/model.py b/‎models/contentunderstanding/classification/model.py ‎models/contentunderstanding/textcnn/model.py
diff --git a/‎models/contentunderstanding/classification/reader.py ‎models/contentunderstanding/textcnn/reader.py b/‎models/contentunderstanding/classification/reader.py ‎models/contentunderstanding/textcnn/reader.py
diff --git a/‎models/contentunderstanding/classification/readme.md ‎models/contentunderstanding/textcnn/readme.md
+4-5 b/‎models/contentunderstanding/classification/readme.md ‎models/contentunderstanding/textcnn/readme.md
+4-5
diff --git a/‎models/contentunderstanding/textcnn_pretrain/__init__.py
+13 b/‎models/contentunderstanding/textcnn_pretrain/__init__.py
+13
diff --git a/‎models/contentunderstanding/textcnn_pretrain/basemodel.py
+118 b/‎models/contentunderstanding/textcnn_pretrain/basemodel.py
+118
diff --git a/‎models/contentunderstanding/textcnn_pretrain/config.yaml
+70 b/‎models/contentunderstanding/textcnn_pretrain/config.yaml
+70
@@ -7,9 +7,27 @@ PaddleRec基于业务实践，使用真实数据，产出了推荐领域算法
 ### 获取地址
 
 ```bash
-wget xxx.tar.gz
+wget https://paddlerec.bj.bcebos.com/textcnn_pretrain%2Fpretrain_model.tar.gz
 ```
 
 ### 使用方法
 
-解压后，得到的是一个paddle的模型文件夹，使用`PaddleRec/models/contentunderstanding/classification_finetue`模型进行加载
+解压后，得到的是一个paddle的模型文件夹，使用`PaddleRec/models/contentunderstanding/textcnn_pretrain`模型进行加载。  
+您可以在PaddleRec/models/contentunderstanding/textcnn_pretrain中找到finetune_startup.py文件，在config.yaml中配置startup_class_path和init_pretraining_model_path两个参数。  
+在参数startup_class_path中配置finetune_startup.py文件的地址，在init_pretraining_model_path参数中配置您要加载的参数文件。  
+以textcnn_pretrain为例，配置完的runner如下：
+```yaml
+runner:
+- name: train_runner
+  class: train
+  epochs: 6
+  device: cpu
+  save_checkpoint_interval: 1
+  save_checkpoint_path: "increment"
+  init_model_path: "" 
+  print_interval: 10
+  startup_class_path: "{workspace}/finetune_startup.py"
+  init_pretraining_model_path: "{workspace}/pretrain_model/pretrain_model_params"
+  phases: phase_train
+```
+具体使用方法请参照textcnn[使用预训练模型进行finetune](https://github.com/PaddlePaddle/PaddleRec/tree/master/models/contentunderstanding/textcnn_pretrain)
@@ -37,6 +37,8 @@
 |      startup_class_path       |    string    |                           路径                            |    否    |                     自定义startup流程实现的地址                      |
 |       runner_class_path       |    string    |                           路径                            |    否    |                      自定义runner流程实现的地址                      |
 |      terminal_class_path      |    string    |                           路径                            |    否    |                     自定义terminal流程实现的地址                     |
+|  init_pretraining_model_path  |    string    |                           路径                            |    否    |自定义的startup流程中需要传入这个参数，finetune中需要加载的参数的地址 |
+
 
 
 
 
@@ -1,7 +1,7 @@
 # 内容理解模型库
 
 ## 简介
-我们提供了常见的内容理解任务中使用的模型算法的PaddleRec实现, 单机训练&预测效果指标以及分布式训练&预测性能指标等。实现的内容理解模型包括 [Tagspace](tagspace)、[文本分类](classification)等。
+我们提供了常见的内容理解任务中使用的模型算法的PaddleRec实现, 单机训练&预测效果指标以及分布式训练&预测性能指标等。实现的内容理解模型包括 [Tagspace](tagspace)、[文本分类](textcnn)、[基于textcnn的预训练模型](textcnn_pretrain)等。
 
 模型算法库在持续添加中，欢迎关注。
 
@@ -23,7 +23,7 @@
 |       模型        |       简介        |       论文        |
 | :------------------: | :--------------------: | :---------: |
 | TagSpace | 标签推荐 | [EMNLP 2014][TagSpace: Semantic Embeddings from Hashtags](https://www.aclweb.org/anthology/D14-1194.pdf) |
-| Classification | 文本分类 | [EMNLP 2014][Convolutional neural networks for sentence classication](https://www.aclweb.org/anthology/D14-1181.pdf) |
+| textcnn | 文本分类 | [EMNLP 2014][Convolutional Neural Networks for Sentence Classification](https://www.aclweb.org/anthology/D14-1181.pdf) |
 
 下面是每个模型的简介（注：图片引用自链接中的论文）
 
@@ -32,7 +32,7 @@
 <img align="center" src="../../doc/imgs/tagspace.png">
 <p>
 
-[文本分类CNN模型](https://www.aclweb.org/anthology/D14-1181.pdf)
+[textCNN模型](https://www.aclweb.org/anthology/D14-1181.pdf)
 <p align="center">
 <img align="center" src="../../doc/imgs/cnn-ckim2014.png">
 <p>
@@ -42,7 +42,7 @@
 git clone https://github.com/PaddlePaddle/PaddleRec.git paddle-rec
 cd paddle-rec
 python -m paddlerec.run -m models/contentunderstanding/tagspace/config.yaml
-python -m paddlerec.run -m models/contentunderstanding/classification/config.yaml
+python -m paddlerec.run -m models/contentunderstanding/textcnn/config.yaml
 ```
 
 ## 使用教程（复现论文）
@@ -134,7 +134,7 @@ batch: 13, acc: [0.928], loss: [0.01736144]
 batch: 14, acc: [0.93], loss: [0.01911209]
 ```
 
-**（2）Classification**
+**（2）textcnn**
 
 ### 数据处理
 情感倾向分析（Sentiment Classification，简称Senta）针对带有主观描述的中文文本，可自动判断该文本的情感极性类别并给出相应的置信度。情感类型分为积极、消极。情感倾向分析能够帮助企业理解用户消费习惯、分析热点话题和危机舆情监控，为企业提供有利的决策支持。  
@@ -206,4 +206,4 @@ batch: 3, acc: [0.90234375], loss: [0.27907994]
 |       数据集        |       模型       |       loss         |       acc         |
 | :------------------: | :--------------------: | :---------: |:---------: | 
 |       ag news dataset        |       TagSpace       |       0.0198        |       0.9177          | 
-|       ChnSentiCorp        |       Classification       |       0.2282        |        0.9127         | 
+|       ChnSentiCorp        |       textcnn       |       0.2282        |        0.9127         | 
@@ -12,7 +12,7 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-workspace: "models/contentunderstanding/classification"
+workspace: "models/contentunderstanding/textcnn"
 
 dataset:
 - name: data1
 
@@ -1,11 +1,11 @@
-# classification文本分类模型
+# textcnn文本分类模型
 
 以下是本例的简要目录结构及说明： 
 
 ```
 ├── data #样例数据
     ├── train
-         ├── train.txt #训练数据样例
+        ├── train.txt #训练数据样例
     ├── test
         ├── test.txt #测试数据样例
     ├── preprocess.py #数据处理程序
@@ -15,7 +15,6 @@
 ├── config.yaml #配置文件
 ├── reader.py #读取程序
 ```
-
 注：在阅读该示例前，建议您先了解以下内容：
 [paddlerec入门教程](https://github.com/PaddlePaddle/PaddleRec/blob/master/README.md)  
 
@@ -73,13 +72,13 @@ os : windows/linux/macos
 本文提供了样例数据可以供您快速体验，在paddlerec目录下直接执行下面的命令即可启动训练： 
 
 ```
-python -m paddlerec.run -m models/contentunderstanding/classification/config.yaml
+python -m paddlerec.run -m models/contentunderstanding/textcnn/config.yaml
 ```   
 
 
 ## 效果复现
 为了方便使用者能够快速的跑通每一个模型，我们在每个模型下都提供了样例数据。如果需要复现readme中的效果,请按如下步骤依次操作即可。  
-1. 确认您当前所在目录为PaddleRec/models/contentunderstanding/classification  
+1. 确认您当前所在目录为PaddleRec/models/contentunderstanding/textcnn  
 2. 下载并解压数据集，命令如下：  
 ``` 
 wget https://baidu-nlp.bj.bcebos.com/sentiment_classification-dataset-1.0.0.tar.gz
 
@@ -0,0 +1,13 @@
+# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
@@ -0,0 +1,118 @@
+#   Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import paddle.fluid as fluid
+from paddlerec.core.utils import envs
+from paddlerec.core.model import ModelBase
+from paddlerec.core.metrics import RecallK
+
+
+class Model(ModelBase):
+    def __init__(self, config):
+        ModelBase.__init__(self, config)
+        self.dict_size = 2000000 + 1
+        self.max_seq_len = 1024
+        self.emb_dim = 128
+        self.cnn_hid_dim = 128
+        self.cnn_win_size = 3
+        self.cnn_win_size2 = 5
+        self.hid_dim1 = 96
+        self.class_dim = 30
+        self.is_sparse = True
+
+    def input_data(self, is_infer=False, **kwargs):
+
+        text = fluid.data(
+            name="text", shape=[None, self.max_seq_len, 1], dtype='int64')
+        label = fluid.data(name="category", shape=[None, 1], dtype='int64')
+        seq_len = fluid.data(name="seq_len", shape=[None], dtype='int64')
+        return [text, label, seq_len]
+
+    def net(self, inputs, is_infer=False):
+        """ network definition """
+        #text label
+        self.data = inputs[0]
+        self.label = inputs[1]
+        self.seq_len = inputs[2]
+        emb = embedding(self.data, self.dict_size, self.emb_dim,
+                        self.is_sparse)
+        concat = multi_convs(emb, self.seq_len, self.cnn_hid_dim,
+                             self.cnn_win_size, self.cnn_win_size2)
+        self.fc_1 = full_connect(concat, self.hid_dim1)
+        self.metrics(is_infer)
+
+    def metrics(self, is_infer=False):
+        """ classification and metrics """
+        # softmax layer
+        prediction = fluid.layers.fc(input=[self.fc_1],
+                                     size=self.class_dim,
+                                     act="softmax",
+                                     name="pretrain_fc_1")
+        cost = fluid.layers.cross_entropy(input=prediction, label=self.label)
+        avg_cost = fluid.layers.mean(x=cost)
+        acc = fluid.layers.accuracy(input=prediction, label=self.label)
+        #acc = RecallK(input=prediction, label=label, k=1)
+
+        self._cost = avg_cost
+        if is_infer:
+            self._infer_results["acc"] = acc
+        else:
+            self._metrics["acc"] = acc
+
+
+def embedding(inputs, dict_size, emb_dim, is_sparse):
+    """ embeding definition """
+    emb = fluid.layers.embedding(
+        input=inputs,
+        size=[dict_size, emb_dim],
+        is_sparse=is_sparse,
+        param_attr=fluid.ParamAttr(
+            name='pretrain_word_embedding',
+            initializer=fluid.initializer.Xavier()))
+    return emb
+
+
+def multi_convs(input_layer, seq_len, cnn_hid_dim, cnn_win_size,
+                cnn_win_size2):
+    """conv and concat"""
+    emb = fluid.layers.sequence_unpad(
+        input_layer, length=seq_len, name="pretrain_unpad")
+    conv = fluid.nets.sequence_conv_pool(
+        param_attr=fluid.ParamAttr(name="pretrain_conv0_w"),
+        bias_attr=fluid.ParamAttr(name="pretrain_conv0_b"),
+        input=emb,
+        num_filters=cnn_hid_dim,
+        filter_size=cnn_win_size,
+        act="tanh",
+        pool_type="max")
+    conv2 = fluid.nets.sequence_conv_pool(
+        param_attr=fluid.ParamAttr(name="pretrain_conv1_w"),
+        bias_attr=fluid.ParamAttr(name="pretrain_conv1_b"),
+        input=emb,
+        num_filters=cnn_hid_dim,
+        filter_size=cnn_win_size2,
+        act="tanh",
+        pool_type="max")
+    concat = fluid.layers.concat(
+        input=[conv, conv2], axis=1, name="pretrain_concat")
+    return concat
+
+
+def full_connect(input_layer, hid_dim1):
+    """full connect layer"""
+    fc_1 = fluid.layers.fc(name="pretrain_fc_0",
+                           input=input_layer,
+                           size=hid_dim1,
+                           act="tanh")
+    return fc_1
@@ -0,0 +1,70 @@
+# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# Directory substituted for the "{workspace}" placeholder used below.
+workspace: 'models/contentunderstanding/textcnn_pretrain'
+
+# Datasets; each phase selects one of them through `dataset_name`.
+dataset:
+  - name: dataset_train
+    batch_size: 128
+    type: DataLoader
+    data_path: '{workspace}/senta_data/train'
+    data_converter: '{workspace}/reader.py'
+  - name: dataset_infer
+    batch_size: 256
+    type: DataLoader
+    data_path: '{workspace}/senta_data/test'
+    data_converter: '{workspace}/reader.py'
+
+hyper_parameters:
+  optimizer:
+    class: adam
+    learning_rate: 0.001
+    strategy: async
+
+# Names of the runners (defined under `runner`) to execute.
+mode: [train_runner, infer_runner]
+
+runner:
+  - name: train_runner
+    class: train
+    epochs: 6
+    device: cpu
+    save_checkpoint_interval: 1
+    save_checkpoint_path: 'increment'
+    init_model_path: ''
+    print_interval: 10
+    # Custom startup implementation used for finetuning.
+    startup_class_path: '{workspace}/finetune_startup.py'
+    # Pretrained parameters to load; leave empty when not finetuning.
+    init_pretraining_model_path: '{workspace}/pretrain_model/pretrain_model_params'
+
+    phases: phase_train
+
+  - name: infer_runner
+    class: infer
+    # Device the infer runner executes on.
+    device: cpu
+    print_interval: 1
+    # Checkpoint directory to load for inference.
+    # NOTE(review): train_runner saves under 'increment' every epoch for
+    # 6 epochs -- confirm that 'increment/3' is the intended checkpoint.
+    init_model_path: 'increment/3'
+    phases: phase_infer
+
+
+phase:
+  - name: phase_train
+    model: '{workspace}/model.py'
+    dataset_name: dataset_train
+    thread_num: 1
+  - name: phase_infer
+    # User-defined model file.
+    model: '{workspace}/model.py'
+    # Selects the dataset entry by its `name`.
+    dataset_name: dataset_infer
+    thread_num: 1