Update artist model activation (#3106)

JunnYu · web-flow · commit d6f460e54ab4 · 2022-10-08T10:45:02.000+08:00
* update

* rename
diff --git a/paddlenlp/transformers/artist/modeling.py b/paddlenlp/transformers/artist/modeling.py
@@ -14,6 +14,7 @@
 # limitations under the License.
 
 import paddle
+import paddle.nn.functional as F
 from ..dallebart.modeling import VQGanDetokenizer
 from ..gpt.modeling import GPTLMHeadModel, GPTLMHead, GPTModel
 
@@ -23,14 +24,17 @@
     'ArtistForConditionalGeneration',
 ]
 
+# alias F.gelu as F.gelu_python, the "hidden_act" name used by the configs below
+F.gelu_python = F.gelu
+
 pretrained_init_configuration = {
     "pai-painter-base-zh": {
         "vocab_size": 37512,
         "hidden_size": 768,
         "num_hidden_layers": 12,
         "num_attention_heads": 12,
         "intermediate_size": 3072,
-        "hidden_act": "gelu",
+        "hidden_act": "gelu_python",
         "hidden_dropout_prob": 0.0,
         "attention_probs_dropout_prob": 0.0,
         "max_position_embeddings": 288,
@@ -47,7 +51,7 @@
         "num_hidden_layers": 12,
         "num_attention_heads": 12,
         "intermediate_size": 3072,
-        "hidden_act": "gelu",
+        "hidden_act": "gelu_python",
         "hidden_dropout_prob": 0.0,
         "attention_probs_dropout_prob": 0.0,
         "max_position_embeddings": 288,
@@ -64,7 +68,7 @@
         "num_hidden_layers": 12,
         "num_attention_heads": 12,
         "intermediate_size": 3072,
-        "hidden_act": "gelu",
+        "hidden_act": "gelu_python",
         "hidden_dropout_prob": 0.0,
         "attention_probs_dropout_prob": 0.0,
         "max_position_embeddings": 288,
@@ -81,7 +85,7 @@
         "num_hidden_layers": 12,
         "num_attention_heads": 12,
         "intermediate_size": 3072,
-        "hidden_act": "gelu",
+        "hidden_act": "gelu_python",
         "hidden_dropout_prob": 0.0,
         "attention_probs_dropout_prob": 0.0,
         "max_position_embeddings": 288,
@@ -98,7 +102,7 @@
         "num_hidden_layers": 24,
         "num_attention_heads": 16,
         "intermediate_size": 4096,
-        "hidden_act": "gelu",
+        "hidden_act": "gelu_python",
         "hidden_dropout_prob": 0.0,
         "attention_probs_dropout_prob": 0.0,
         "max_position_embeddings": 288,
diff --git a/paddlenlp/transformers/dallebart/tokenizer.py b/paddlenlp/transformers/dallebart/tokenizer.py
@@ -101,7 +101,7 @@ def best_match(i):
 
 def replace_person_token(t):
     "Used for CC12M"
-    t = re.sub("<person>([,\s]*(and)*[,\s]*<person>)+", " people ", t)
+    t = re.sub(r"<person>([,\s]*(and)*[,\s]*<person>)+", " people ", t)
     while "<person>" in t:
         t = t.replace("<person>",
                       f" {random.choices(*tuple(zip(*person_token)))[0]} ", 1)
@@ -114,27 +114,27 @@ def fix_html(t):
 
 
 def replace_punctuation_with_commas(t):
-    return re.sub("[()[\].,|:;?!=+~\-\/{}]", ",", t)
+    return re.sub(r"[()[\].,|:;?!=+~\-\/{}]", ",", t)
 
 
 def simplify_quotes(t):
     return re.sub("""['"`]""", ' " ', t)
 
 
 def merge_quotes(t):
-    return re.sub('(\s*"+\s*)+', ' " ', t)
+    return re.sub(r'(\s*"+\s*)+', ' " ', t)
 
 
 def remove_comma_numbers(t):
 
     def _f(t):
-        return re.sub("(\d),(\d{3})", r"\1\2", t)
+        return re.sub(r"(\d),(\d{3})", r"\1\2", t)
 
     return _f(_f(t))
 
 
 def pre_process_dot_numbers(t):
-    return re.sub("(\w)\.(\w)", rf"\1{temp_token}dot{temp_token}\2", t)
+    return re.sub(r"(\w)\.(\w)", rf"\1{temp_token}dot{temp_token}\2", t)
 
 
 def post_process_dot_numbers(t):
@@ -152,15 +152,15 @@ def post_process_quotes(t):
 
 
 def pre_process_dates(t):
-    return re.sub("(\d)/(\d)", rf"\1{temp_token}slash{temp_token}\2", t)
+    return re.sub(r"(\d)/(\d)", rf"\1{temp_token}slash{temp_token}\2", t)
 
 
 def post_process_dates(t):
     return re.sub(f"{temp_token}slash{temp_token}", "/", t)
 
 
 def merge_commas(t):
-    return re.sub("(\s*,+\s*)+", ", ", t)
+    return re.sub(r"(\s*,+\s*)+", ", ", t)
 
 
 def add_space_after_commas(t):
@@ -170,14 +170,14 @@ def add_space_after_commas(t):
 def handle_special_chars(t):
     "Handle special characters"
     # replace "-" with a space when between words without space
-    t = re.sub("(\w)-(\w)", r"\1 \2", t)
+    t = re.sub(r"(\w)-(\w)", r"\1 \2", t)
     # always add space around some characters
-    return re.sub("([%&\/$*])", r" \1 ", t)
+    return re.sub(r"([%&\/$*])", r" \1 ", t)
 
 
 def expand_hashtags(t, hashtag_processor):
     "Remove # and try to split words"
-    return re.sub("#(\w+)", lambda m: hashtag_processor(m.group(1)), t)
+    return re.sub(r"#(\w+)", lambda m: hashtag_processor(m.group(1)), t)
 
 
 _re_ignore_chars = r"[_#\\]"
@@ -190,7 +190,7 @@ def ignore_chars(t):
 
 def remove_extra_spaces(t):
     "Remove extra spaces (including \t and \n)"
-    return re.sub("\s+", " ", t)
+    return re.sub(r"\s+", " ", t)
 
 
 def remove_repeating_chars(t):