@@ -73,6 +73,130 @@ def model_1(input_shape, output_shape):
     return model
 
 
+def model_1_small(input_shape, output_shape):
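+    # smaller variant of model_1: same branch topology, 32-unit Bi-LSTMs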
+    # Input (batch, 10, 60)
+    input_1 = layers.Input(shape=input_shape[1:], dtype="float32")
+    input_2 = layers.Input(shape=input_shape[1:], dtype="float32")
+    input_3 = layers.Input(shape=input_shape[1:], dtype="float32")
+    input_4 = layers.Input(shape=input_shape[1:], dtype="float32")
+    input_5 = layers.Input(shape=input_shape[1:], dtype="float32")
+    input_6 = layers.Input(shape=input_shape[1:], dtype="float32")
+
+    # ----------- Three box sequence -----------
+    # Concat (batch, 30, 60)
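+    # axis=-2 stacks the three 10-step boxes along the time axis (3 x 10 = 30)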
+    concat_1 = layers.concatenate([input_1, input_2, input_3], axis=-2, name='seq_concat')
+    concat_2 = layers.concatenate([input_4, input_5, input_6], axis=-2)
+
+    # Bi-LSTM (batch, 30, 64)
+    bi_lstm_1 = layers.Bidirectional(layers.LSTM(32, return_sequences=True))(concat_1)
+    bi_lstm_2 = layers.Bidirectional(layers.LSTM(32, return_sequences=True))(concat_2)
+
+    # Self-Attention (batch, 30, 64)
+    self_attention_1 = SeqSelfAttention(attention_activation='sigmoid')(bi_lstm_1)
+    self_attention_2 = SeqSelfAttention(attention_activation='sigmoid')(bi_lstm_2)
+
+    # Dense (batch, 30, 1)
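+    # output_shape[0] is expected to be 1 here, so the squeeze below gives (batch, 30)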
+    dense_1 = layers.Dense(output_shape[0], activation="relu")(self_attention_1)
+    dense_2 = layers.Dense(output_shape[0], activation="relu")(self_attention_2)
+
+    # Squeeze (batch, 30)
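+    # Lambda and K (keras.backend) are assumed to be imported at the top of this file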
+    squeeze_1 = Lambda(lambda x: K.squeeze(x, axis=-1))(dense_1)
+    squeeze_2 = Lambda(lambda x: K.squeeze(x, axis=-1))(dense_2)
+
+    # ----------- One box feature -----------
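+    # only input_2 feeds this branch (presumably the box being scored)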
+    # Bi-LSTM (batch, 10, 64)
+    bi_lstm = layers.Bidirectional(layers.LSTM(32, return_sequences=True))(input_2)
+
+    # Self-Attention (batch, 10, 64)
+    self_attention = SeqSelfAttention(attention_activation='sigmoid')(bi_lstm)
+
+    # mask mean pooling
+    # pool_1 = MyAveragePooling1D(axis=-1)(self_attention_1)
+
+    # Dense (batch, 10, 1)
+    dense = layers.Dense(output_shape[0], activation="relu")(self_attention)
+
+    # Squeeze (batch, 10) - one box feature
+    squeeze = Lambda(lambda x: K.squeeze(x, axis=-1))(dense)
+
+    # ----------- Three box sequence & One box feature -----------
+    # Concat (batch, 70), then Dense down to (batch, 1)
+    concat = layers.concatenate([squeeze, squeeze_1, squeeze_2])
+    output = layers.Dense(32, activation='relu')(concat)
+    output = layers.Dense(1, activation="sigmoid", name='output')(output)
+
+    model = models.Model(inputs=[input_1, input_2, input_3, input_4, input_5, input_6],
+                         outputs=output)
+
+    # model.summary()
+    return model
+
+
+def model_1_tiny(input_shape, output_shape):
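+    # tiny variant: same topology as model_1_small, 16-unit Bi-LSTMs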
+    # Input (batch, 10, 60)
+    input_1 = layers.Input(shape=input_shape[1:], dtype="float32")
+    input_2 = layers.Input(shape=input_shape[1:], dtype="float32")
+    input_3 = layers.Input(shape=input_shape[1:], dtype="float32")
+    input_4 = layers.Input(shape=input_shape[1:], dtype="float32")
+    input_5 = layers.Input(shape=input_shape[1:], dtype="float32")
+    input_6 = layers.Input(shape=input_shape[1:], dtype="float32")
+
+    # ----------- Three box sequence -----------
+    # Concat (batch, 30, 60)
+    concat_1 = layers.concatenate([input_1, input_2, input_3], axis=-2, name='seq_concat')
+    concat_2 = layers.concatenate([input_4, input_5, input_6], axis=-2)
+
+    # Bi-LSTM (batch, 30, 32)
+    bi_lstm_1 = layers.Bidirectional(layers.LSTM(16, return_sequences=True))(concat_1)
+    bi_lstm_2 = layers.Bidirectional(layers.LSTM(16, return_sequences=True))(concat_2)
+
+    # Self-Attention (batch, 30, 32)
+    self_attention_1 = SeqSelfAttention(attention_activation='sigmoid')(bi_lstm_1)
+    self_attention_2 = SeqSelfAttention(attention_activation='sigmoid')(bi_lstm_2)
+
+    # Dense (batch, 30, 1)
+    dense_1 = layers.Dense(output_shape[0], activation="relu")(self_attention_1)
+    dense_2 = layers.Dense(output_shape[0], activation="relu")(self_attention_2)
+
+    # Squeeze (batch, 30)
+    squeeze_1 = Lambda(lambda x: K.squeeze(x, axis=-1))(dense_1)
+    squeeze_2 = Lambda(lambda x: K.squeeze(x, axis=-1))(dense_2)
+
+    # ----------- One box feature -----------
+    # Bi-LSTM (batch, 10, 32)
+    bi_lstm = layers.Bidirectional(layers.LSTM(16, return_sequences=True))(input_2)
+
+    # Self-Attention (batch, 10, 32)
+    self_attention = SeqSelfAttention(attention_activation='sigmoid')(bi_lstm)
+
+    # mask mean pooling
+    # pool_1 = MyAveragePooling1D(axis=-1)(self_attention_1)
+
+    # Dense (batch, 10, 1)
+    dense = layers.Dense(output_shape[0], activation="relu")(self_attention)
+
+    # Squeeze (batch, 10) - one box feature
+    squeeze = Lambda(lambda x: K.squeeze(x, axis=-1))(dense)
+
+    # ----------- Three box sequence & One box feature -----------
+    # Concat (batch, 70), then Dense down to (batch, 1)
+    concat = layers.concatenate([squeeze, squeeze_1, squeeze_2])
+    output = layers.Dense(16, activation='relu')(concat)
+    output = layers.Dense(1, activation="sigmoid", name='output')(output)
+
+    model = models.Model(inputs=[input_1, input_2, input_3, input_4, input_5, input_6],
+                         outputs=output)
+
+    # model.summary()
+    return model
+
+
 def model_2(input_shape, output_shape):
     # input_shape = (None, None, 10, 60)
     # (batch_size, row_num, col_num, character_num, character_embedding)
@@ -266,7 +390,7 @@ def model_3(input_shape, output_shape):
 
 def get_model(input_shape, output_shape, model_id):
     if model_id == 1:
-        return model_1(input_shape, output_shape)
+        return model_1_tiny(input_shape, output_shape)
     elif model_id == 2:
         return model_2(input_shape, output_shape)
     elif model_id == 3: