outputs=(logits,)+transformer_outputs[1:]# Keep new_mems and attention/hidden states if they are here
returnoutputs
@add_start_docstrings("""XLM Model with a span classification head on top for extractive question-answering tasks like SQuAD (linear layers on top of
the hidden-states output to compute `span start logits` and `span end logits`). """,