@@ -70,6 +70,7 @@ class XLMRobertaModel(RobertaModel):
7070 documentation alongside usage examples.
7171 """
7272
73+ _keys_to_ignore_on_load_missing = [r"lm_head.decoder.bias" , "position_ids" ]
7374 config_class = XLMRobertaConfig
7475
7576
@@ -83,6 +84,7 @@ class XLMRobertaForCausalLM(RobertaForCausalLM):
8384 documentation alongside usage examples.
8485 """
8586
87+ _keys_to_ignore_on_load_missing = [r"lm_head.decoder.bias" , "position_ids" ]
8688 config_class = XLMRobertaConfig
8789
8890
@@ -96,6 +98,7 @@ class XLMRobertaForMaskedLM(RobertaForMaskedLM):
9698 documentation alongside usage examples.
9799 """
98100
101+ _keys_to_ignore_on_load_missing = [r"lm_head.decoder.bias" , "position_ids" ]
99102 config_class = XLMRobertaConfig
100103
101104
@@ -112,6 +115,7 @@ class XLMRobertaForSequenceClassification(RobertaForSequenceClassification):
112115 appropriate documentation alongside usage examples.
113116 """
114117
118+ _keys_to_ignore_on_load_missing = [r"lm_head.decoder.bias" , "position_ids" ]
115119 config_class = XLMRobertaConfig
116120
117121
@@ -128,6 +132,7 @@ class XLMRobertaForMultipleChoice(RobertaForMultipleChoice):
128132 appropriate documentation alongside usage examples.
129133 """
130134
135+ _keys_to_ignore_on_load_missing = [r"lm_head.decoder.bias" , "position_ids" ]
131136 config_class = XLMRobertaConfig
132137
133138
@@ -144,6 +149,7 @@ class XLMRobertaForTokenClassification(RobertaForTokenClassification):
144149 appropriate documentation alongside usage examples.
145150 """
146151
152+ _keys_to_ignore_on_load_missing = [r"lm_head.decoder.bias" , "position_ids" ]
147153 config_class = XLMRobertaConfig
148154
149155
@@ -160,4 +166,5 @@ class XLMRobertaForQuestionAnswering(RobertaForQuestionAnswering):
160166 appropriate documentation alongside usage examples.
161167 """
162168
169+ _keys_to_ignore_on_load_missing = [r"lm_head.decoder.bias" , "position_ids" ]
163170 config_class = XLMRobertaConfig
0 commit comments