Created by: puleon
- new classes structure for siamese networks to perform ranking and paraphrase identification
- new preprocessor class to work with data samples containing few strings for siamese networks
- all components (including tokenizer, vocabularies and embedder) are standard and set in config
- new model with BiLSTM, GRU and max pooling to take into account multi-turn dialogue context
- configs for ranking on ubuntu v2 dialogue corpus with and without taking into account multi-turn context
- new predictor class for siamese networks to work in interact mode
- separate configs for interact mode
- bug fix in SimpleVocabulary class
- tests for all new configs
Activity
- Last updated by Andrei Glinskii
6 # 7 # http://www.apache.org/licenses/LICENSE-2.0 8 # 9 # Unless required by applicable law or agreed to in writing, software 10 # distributed under the License is distributed on an "AS IS" BASIS, 11 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 # See the License for the specific language governing permissions and 13 # limitations under the License. 14 15 16 from deeppavlov.core.data.dataset_reader import DatasetReader 17 from typing import List, Tuple, Union, Dict 18 19 from pathlib import Path 20 from deeppavlov.core.common.registry import register 21 import csv 16 from typing import List, Dict, Tuple, Union 17 from pathlib import Path 18 import csv 19 20 from deeppavlov.core.data.dataset_reader import DatasetReader 21 from deeppavlov.core.common.registry import register 22 from deeppavlov.core.commands.utils import expand_path 23 24 @register('ubuntu_v2_reader') 25 class UbuntuV2Reader(DatasetReader): 26 """The class to read the Ubuntu V2 dataset from csv files. 27 28 Please, see https://github.com/rkadlec/ubuntu-ranking-dataset-creator. 29 30 Args: 31 data_path: A path to a folder with dataset csv files. - Last updated by Andrei Glinskii
- Last updated by Andrei Glinskii
- Last updated by Andrei Glinskii
- Last updated by Andrei Glinskii
- Last updated by Andrei Glinskii
- Last updated by Andrei Glinskii
71 "triplet_loss": false, 72 "batch_size": 256, 73 "save_path": "ubuntu_v2_mt_model/model_weights.h5", 74 "load_path": "ubuntu_v2_mt_model/model_weights.h5" 75 }, 76 { 77 "in": ["x_proc"], 78 "in_y": ["y"], 79 "out": ["y_predicted"], 80 "name": "siamese_predictor", 81 "model": "#model", 82 "num_context_turns": "#model.num_context_turns", 83 "batch_size": "#model.batch_size", 84 "interact_pred_num": 3, 85 "responses": "#siam_sent_vocab", 86 "preproc_func": "#preproc.__call__" - Last updated by Andrei Glinskii
10 # distributed under the License is distributed on an "AS IS" BASIS, 11 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 # See the License for the specific language governing permissions and 13 # limitations under the License. 14 15 import numpy as np 16 from typing import List, Iterable, Union 17 18 from deeppavlov.core.models.nn_model import NNModel 19 20 21 class SiameseModel(NNModel): 22 """The class implementing base functionality for siamese neural networks. 23 24 Args: 25 batch_size: A size of a batch. 1 # Copyright 2017 Neural Networks and Deep Learning lab, MIPT 2 # 3 # Licensed under the Apache License, Version 2.0 (the "License"); 4 # you may not use this file except in compliance with the License. 5 # You may obtain a copy of the License at 6 # 7 # http://www.apache.org/licenses/LICENSE-2.0 8 # 9 # Unless required by applicable law or agreed to in writing, software 10 # distributed under the License is distributed on an "AS IS" BASIS, 11 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12 # See the License for the specific language governing permissions and 13 # limitations under the License. 14 15 import numpy as np 16 from typing import List, Iterable, Union - Last updated by Andrei Glinskii
64 self.batch_size = batch_size 65 self.num_context_turns = num_context_turns 66 self.ranking = ranking 67 self.attention = attention 68 self.responses = {el[1]: el[0] for el in responses.items()} 69 self.preproc_responses = [] 70 self.response_embeddings = None 71 self.preproc_func = preproc_func 72 self.interact_pred_num = interact_pred_num 73 self.model = model 74 self._build_preproc_responses() 75 if not self.attention: 76 self._build_response_embeddings() 77 78 def __call__(self, batch: Iterable[List[np.ndarray]]) -> List[Union[List[str],str]]: 79 context = next(batch) - Last updated by Andrei Glinskii
- Last updated by Andrei Glinskii
Please register or sign in to reply