mirror of
https://github.com/huggingface/transformers.git
synced 2025-07-31 10:12:23 +06:00
![]() * Remove "Model" suffix from Flax models to look more 🤗 Signed-off-by: Morgan Funtowicz <morgan@huggingface.co> * Initial working (forward + backward) for Flax MLM training example. Signed-off-by: Morgan Funtowicz <morgan@huggingface.co> * Simply code Signed-off-by: Morgan Funtowicz <morgan@huggingface.co> * Addressing comments, using module and moving to LM task. Signed-off-by: Morgan Funtowicz <morgan@huggingface.co> * Restore parameter name "module" wrongly renamed model. Signed-off-by: Morgan Funtowicz <morgan@huggingface.co> * Restore correct output ordering... Signed-off-by: Morgan Funtowicz <morgan@huggingface.co> * Actually commit the example 😅 Signed-off-by: Morgan Funtowicz <morgan@huggingface.co> * Add FlaxBertModelForMaskedLM after rebasing. Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Make it possible to initialize the training from scratch Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Reuse flax linen example of cross entropy loss Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Added specific data collator for flax Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Remove todo for data collator Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Added evaluation step Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Added ability to provide dtype to support bfloat16 on TPU Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Enable flax tensorboard output Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Enable jax.pmap support. Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Ensure batches are correctly sized to be dispatched with jax.pmap Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Enable bfloat16 with --fp16 cmdline args Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Correctly export metrics to tensorboard Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Added dropout and ability to use it. Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Effectively enable & disable during training and evaluation steps. Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Oops. Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Enable specifying kernel initializer scale Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Style. Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Added warmup step to the learning rate scheduler. Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Fix typo. Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Print training loss Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Make style Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * fix linter issue (flake8) Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Fix model matching Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Fix dummies Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Fix non default dtype on Flax models Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Use the same create_position_ids_from_input_ids for FlaxRoberta Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Make Roberta attention as Bert Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * fix copy Signed-off-by: Morgan Funtowicz <funtowiczmo@gmail.com> * Wording. Co-authored-by: Marc van Zee <marcvanzee@gmail.com> Co-authored-by: Marc van Zee <marcvanzee@gmail.com> |
||
---|---|---|
.. | ||
fixtures | ||
__init__.py | ||
conftest.py | ||
test_activations_tf.py | ||
test_activations.py | ||
test_benchmark_tf.py | ||
test_benchmark.py | ||
test_cli.py | ||
test_configuration_auto.py | ||
test_configuration_common.py | ||
test_data_collator.py | ||
test_doc_samples.py | ||
test_file_utils.py | ||
test_flax_auto.py | ||
test_generation_beam_search.py | ||
test_generation_logits_process.py | ||
test_generation_utils.py | ||
test_hf_api.py | ||
test_hf_argparser.py | ||
test_logging.py | ||
test_model_card.py | ||
test_model_output.py | ||
test_modeling_albert.py | ||
test_modeling_auto.py | ||
test_modeling_bart.py | ||
test_modeling_bert_generation.py | ||
test_modeling_bert.py | ||
test_modeling_blenderbot.py | ||
test_modeling_camembert.py | ||
test_modeling_common.py | ||
test_modeling_ctrl.py | ||
test_modeling_deberta.py | ||
test_modeling_distilbert.py | ||
test_modeling_dpr.py | ||
test_modeling_electra.py | ||
test_modeling_encoder_decoder.py | ||
test_modeling_flaubert.py | ||
test_modeling_flax_bert.py | ||
test_modeling_flax_roberta.py | ||
test_modeling_fsmt.py | ||
test_modeling_funnel.py | ||
test_modeling_gpt2.py | ||
test_modeling_layoutlm.py | ||
test_modeling_longformer.py | ||
test_modeling_lxmert.py | ||
test_modeling_marian.py | ||
test_modeling_mbart.py | ||
test_modeling_mobilebert.py | ||
test_modeling_mpnet.py | ||
test_modeling_mt5.py | ||
test_modeling_openai.py | ||
test_modeling_pegasus.py | ||
test_modeling_prophetnet.py | ||
test_modeling_rag.py | ||
test_modeling_reformer.py | ||
test_modeling_roberta.py | ||
test_modeling_squeezebert.py | ||
test_modeling_t5.py | ||
test_modeling_tf_albert.py | ||
test_modeling_tf_auto.py | ||
test_modeling_tf_bart.py | ||
test_modeling_tf_bert.py | ||
test_modeling_tf_blenderbot.py | ||
test_modeling_tf_camembert.py | ||
test_modeling_tf_common.py | ||
test_modeling_tf_ctrl.py | ||
test_modeling_tf_distilbert.py | ||
test_modeling_tf_dpr.py | ||
test_modeling_tf_electra.py | ||
test_modeling_tf_flaubert.py | ||
test_modeling_tf_funnel.py | ||
test_modeling_tf_gpt2.py | ||
test_modeling_tf_longformer.py | ||
test_modeling_tf_lxmert.py | ||
test_modeling_tf_marian.py | ||
test_modeling_tf_mbart.py | ||
test_modeling_tf_mobilebert.py | ||
test_modeling_tf_mpnet.py | ||
test_modeling_tf_mt5.py | ||
test_modeling_tf_openai.py | ||
test_modeling_tf_pegasus.py | ||
test_modeling_tf_pytorch.py | ||
test_modeling_tf_roberta.py | ||
test_modeling_tf_t5.py | ||
test_modeling_tf_transfo_xl.py | ||
test_modeling_tf_xlm_roberta.py | ||
test_modeling_tf_xlm.py | ||
test_modeling_tf_xlnet.py | ||
test_modeling_transfo_xl.py | ||
test_modeling_xlm_prophetnet.py | ||
test_modeling_xlm_roberta.py | ||
test_modeling_xlm.py | ||
test_modeling_xlnet.py | ||
test_onnx.py | ||
test_optimization_tf.py | ||
test_optimization.py | ||
test_pipelines_common.py | ||
test_pipelines_conversational.py | ||
test_pipelines_feature_extraction.py | ||
test_pipelines_fill_mask.py | ||
test_pipelines_ner.py | ||
test_pipelines_question_answering.py | ||
test_pipelines_sentiment_analysis.py | ||
test_pipelines_summarization.py | ||
test_pipelines_text_generation.py | ||
test_pipelines_text2text_generation.py | ||
test_pipelines_translation.py | ||
test_pipelines_zero_shot.py | ||
test_retrieval_rag.py | ||
test_skip_decorators.py | ||
test_tokenization_albert.py | ||
test_tokenization_auto.py | ||
test_tokenization_bart.py | ||
test_tokenization_barthez.py | ||
test_tokenization_bert_generation.py | ||
test_tokenization_bert_japanese.py | ||
test_tokenization_bert.py | ||
test_tokenization_bertweet.py | ||
test_tokenization_blenderbot.py | ||
test_tokenization_camembert.py | ||
test_tokenization_common.py | ||
test_tokenization_ctrl.py | ||
test_tokenization_deberta.py | ||
test_tokenization_distilbert.py | ||
test_tokenization_dpr.py | ||
test_tokenization_fsmt.py | ||
test_tokenization_funnel.py | ||
test_tokenization_gpt2.py | ||
test_tokenization_herbert.py | ||
test_tokenization_layoutlm.py | ||
test_tokenization_lxmert.py | ||
test_tokenization_marian.py | ||
test_tokenization_mbart.py | ||
test_tokenization_mpnet.py | ||
test_tokenization_openai.py | ||
test_tokenization_pegasus.py | ||
test_tokenization_phobert.py | ||
test_tokenization_prophetnet.py | ||
test_tokenization_rag.py | ||
test_tokenization_reformer.py | ||
test_tokenization_roberta.py | ||
test_tokenization_squeezebert.py | ||
test_tokenization_t5.py | ||
test_tokenization_transfo_xl.py | ||
test_tokenization_utils.py | ||
test_tokenization_xlm_prophetnet.py | ||
test_tokenization_xlm_roberta.py | ||
test_tokenization_xlm.py | ||
test_tokenization_xlnet.py | ||
test_trainer_callback.py | ||
test_trainer_distributed.py | ||
test_trainer_tpu.py | ||
test_trainer_utils.py | ||
test_trainer.py | ||
test_utils_check_copies.py | ||
test_versions_utils.py |