|
|
|
@@ -173,8 +173,8 @@ test_sets = [ |
|
|
|
embedding_size=768, |
|
|
|
embedding_shape=[1, 128, 768], |
|
|
|
use_one_hot_embeddings=True, |
|
|
|
initializer_range=0.02), 1, 1), { |
|
|
|
'init_param_with': lambda shp: np.ones(shp).astype(np.float32)}), |
|
|
|
initializer_range=0.02), 1, 1), |
|
|
|
{'init_param_with': lambda shp: np.ones(shp).astype(np.float32)}), |
|
|
|
'desc_inputs': [input_ids], |
|
|
|
'desc_bprop': [[128]]}), |
|
|
|
('EmbeddingLookup_multi_outputs_init_param', { |
|
|
|
@@ -182,8 +182,8 @@ test_sets = [ |
|
|
|
embedding_size=768, |
|
|
|
embedding_shape=[1, 128, 768], |
|
|
|
use_one_hot_embeddings=False, |
|
|
|
initializer_range=0.02), { |
|
|
|
'init_param_with': lambda shp: np.ones(shp).astype(np.float32)}), |
|
|
|
initializer_range=0.02), |
|
|
|
{'init_param_with': lambda shp: np.ones(shp).astype(np.float32)}), |
|
|
|
'desc_inputs': [input_ids], |
|
|
|
'desc_bprop': [[1, 128, 768], [128]]}), |
|
|
|
('EmbeddingLookup_multi_outputs_grad_with_no_sens', { |
|
|
|
@@ -191,8 +191,8 @@ test_sets = [ |
|
|
|
embedding_size=768, |
|
|
|
embedding_shape=[1, 128, 768], |
|
|
|
use_one_hot_embeddings=False, |
|
|
|
initializer_range=0.02), { |
|
|
|
'init_param_with': lambda shp: np.ones(shp).astype(np.float32)}), |
|
|
|
initializer_range=0.02), |
|
|
|
{'init_param_with': lambda shp: np.ones(shp).astype(np.float32)}), |
|
|
|
'desc_inputs': [input_ids]}), |
|
|
|
('GetMaskedLMOutput_grad_with_no_sens', { |
|
|
|
'block': GetMaskedLMOutput(BertConfig(batch_size=1)), |
|
|
|
|