mirror of
https://github.com/saymrwulf/transformers.git
synced 2026-05-14 20:58:08 +00:00
Commit graph
Select branches
Hide pull requests
'delete-delete-doc'
29625_add_prefix_space
29625_prefix_space
30824-spmconverter-user-defined-symbol
31187_depreciate_clean_up_tokenization_spaced
BritneyMuller-housekeeping-patch
LysandreJik-patch-1
_dummy_fix_weight_only_usage
_dummy_fix_weight_only_usage_2
add-deci-lm
add-flash-decoding
add-fp8-llama-script
add-git-lfs-to-amd-image
add-qgalore
add-rwkv5
add-warning-4bit-opti
add_amd_daily_ci
add_back_generative_class
add_deformable_detr
add_fa2_bart
add_important_warning_padding_attention_mask
add_kosmos_2_remote
add_kosmos_2_temp
add_kosmos_2_utm5_attn
add_kosmos_2_utm5_attn_rebased
add_kosmos_2_utm5_attn_rebased_flat_layer_structure
add_num_workers_for_tf
add_pipeline_equivalence_testing
add_prefix_space_29625
add_prefix_space_clean
add_siglip_fast_tokenizer_bis
add_tf_export_doc
add_word_level_timestamp_long
adding_fp8_quantization
agent_callback
agents-count-tokens
agents-make-easier-tags
agents-messages
albertvillanova-patch-1
allow_old_falcon_name
amd-nightly-ci
amdgpu-multi-gpu-tests
another_prepare_dataset_fix
api_big2
arijitx/wav2vec2_alignment
assistant_decoding_batch
attn-implementation-vision-enc-dec
auot-convert-tekken
auto-assign-reviewers
auto_gpt4_conversion
autoformer-test-seq-to-seq-add-atol
best_benchmark
best_benchmark_new
best_benchmark_on_static_cache
best_benchmark_on_static_cache_new
bloom_big
bos_eos_token_fix
bos_eos_token_slow
build-check-deepspeed-image
build-docker-torch-2.2
build_ci_docker_image_amd1
build_ci_docker_image_amd2
build_ci_docker_image_amd3
build_docker_on_kube
build_docker_on_kube_2
build_docker_on_kube_3
build_image_abc
byebye
byebye_py_37
cache_exp
change-ci
chat_template_kwargs
check-deepspeed
check-send-headers-when-converting-safetensors
check-whisper-slow-tests
check_amd_image_build
check_compile
check_compile_if_flaky
check_doc_test
check_docker_i
check_ds
check_example_ci
check_example_job
check_fastspeech
check_fix_fix_fix
check_fix_torch_pip
check_flaky
check_flax_example
check_gated_repo
check_gemma
check_gemma_compile
check_gemma_compile_2
check_gen_2
check_layoutlm
check_layoutlmv2
check_limit
check_mem
check_mem_00c1d87
check_mem_3cefac1d
check_mem_56b64bf
check_mem_838b87a
check_nightly_build
check_nightly_build_build_image
check_nougat
check_past_runner
check_permission
check_quant
check_quantized_param_bnb4
check_report
check_safetensors_rc
check_slow_pr
check_speed_no_empty
check_strange_doctest
check_tiny_creation
check_torch_2.2
check_trigger_4d8427f7
check_trigger_a81cf9ee
check_update_cache_number
check_ved_trocr
check_what_wrong_in_tiny_creation
checkout-layoutlm-tokenizers
chunk_length_ctc
ci-amdgpu-build-docker-images
ci-amdgpu-mi250
ci-amdgpu-nightly
ci-test-huggingface-hub-v0.15.0.rc0
ci-test-huggingface-hub-v0.16.0.rc0
ci-test-huggingface-hub-v0.17.0.rc0
ci-test-huggingface-hub-v0.18.0.rc0
ci-test-huggingface-hub-v0.19.0.rc0
ci-test-huggingface-hub-v0.20.0.rc1
ci-test-huggingface-hub-v0.21.0.rc0
ci-test-huggingface-hub-v0.22.0.rc0
ci-test-huggingface-hub-v0.23.0.rc0
ci-test-huggingface-hub-v0.23.0.rc1
ci-test-huggingface-hub-v0.24.0.rc0
ci-test-huggingface-hub-v0.25.0.rc0
ci-test-huggingface-hub-v0.25.0.rc1
ci-test-huggingface-hub-v0.26.0.rc0
ci-test-huggingface-hub-v0.27.0.rc0
ci-test-huggingface-hub-v0.27.0.rc1
ci-test-huggingface-hub-v0.27.0rc1
ci-test-huggingface-hub-v0.28.0.rc0
ci-test-huggingface-hub-v0.28.0.rc5
circleci_combine_reports
circleci_debug_base
circleci_debug_base_MobileNetV1ModelTest_test_batching_equivalence
circleci_debug_base_timm
circleci_debug_base_timm_3
clean_spmcoverter
cohere-diff
cohere-diff-2
compare_ci_with_torch_2.2
compile-rope
continuous-batching
custom_bloom_kernel
databricks
dduf-compability
dduf-compatibility-with-file-explorer
deberta-xla-fixes
debug_bloom
debug_get_jobs
debug_kosmos_2_output
debug_mem_0b192de1
debug_mem_95b37495
debug_metadata_run
debugdebug
debugdebug-2
debugdebug-5
deepseek_v2_support
deepspeed-amd-pytorch-version-fix
default-auto
default-fast-load
delete_big_tokenizer_block
deprecate_LegacyIndex
disable_multi_gpu
doc-builder
doc-link-one-or-two-papers-lysandre
doc-regactor
doc_builder_rename
doc_pr
docker_change_awq_version
docs-ctrl-lys
dont-use-deprecated-method
drop_py38_build_img_2
ds-fix-resume
ds-ignore_mismatched_sizes
dynamic_length_in_static_cache
dynamic_length_in_static_cache_001
dynamic_length_in_static_cache_002
dynamic_length_in_static_cache_reconstruct_tensors_from_length
dynamic_length_on_0ae789e0
dynamic_length_on_75bbfd5b
dynamic_length_on_95b3c381
dynamic_length_on_b6eb708b
enable_tf_numpy
faster_cache_without_compile
faster_copies
faster_set_initialized_submodules
fire
fix-Parameter-init
fix-Seq2SeqTrainingArguments-doc
fix-autoprocessor-import-order
fix-bnb-warning
fix-ci
fix-ci-setup
fix-copies
fix-device-map
fix-doc-builder-edit
fix-flash-comment
fix-from-pretrained
fix-gemma2-sdpa
fix-gemma2-sliding-window
fix-gpt2-scaled-init
fix-int8-serilation
fix-kwargs-issues
fix-llama-3-gguf
fix-pipeline-predict-transform-methods
fix-pixtral-tests
fix-pytorch-deepspeed-image
fix-quality-2
fix-red-ci-atol
fix-slow-tests-shieh-trigger
fix-task-mappings
fix-word-ids
fix-workflow
fix_TFMarianModelTest_test_xla_generate_slow
fix_aria_ci
fix_auto_test
fix_autoawq_docker
fix_autoawq_test
fix_bamba_test
fix_check_copies
fix_chinese_clip
fix_convert_spm_bpe
fix_deprecation_warnings
fix_dinat_2
fix_dinov2
fix_docker_autoawq
fix_docker_autogptq_from_source
fix_doctest
fix_doctest_based_on_refactor_doctest_2
fix_eetq_test
fix_falcon_processor
fix_flaky_4
fix_flaky_test_assisted_decoding_matches_greedy_search
fix_flaky_test_pt_tf_model_equivalence
fix_fp_32
fix_generate_embeds
fix_gptq_test
fix_gptq_tests
fix_jetmoe
fix_more_input_out
fix_not_init
fix_peft_model_in_pipelines
fix_pipe_tests_001
fix_quanto_llama27b
fix_remote_tool
fix_slow_gen_on_0ae789e0
fix_slow_gen_on_75bbfd5b
fix_slow_gen_on_b6eb708b
fix_st5_docs
fix_stupid_cond
fix_test_encode_decode
fix_test_fetcher_tests
fix_tie
fix_whisper_ci
fix_whisper_tflite_export
fix_zh_quicktour_md
flex_attention_qwen2
flex_attn_example
for_test_run_squad_no_trainer
force-convert
full-bf16-train
full_length_on_468f7cca
full_length_on_68b71c85
full_length_on_862cde4c
gemma_allow_compile
general_test_low_cpu_mem
get_bad_commits_for_daily_ci_11_20
get_bad_commits_for_daily_ci_11_26
gpt-flex-attention
gpt-mqa
gptneo_gpt4_port
gptneo_gpt4_port_new
hardware-auto-setup
hardware-auto-setup-ci
hotfix_ci_222
hqq_serialization
idefics3
ifix_aqlm_modules_to_not_convert
improve_error_message_asr_pipeline
improve_error_message_when_transformers_is_misconfigured
improve_torch_version_check
informative-detr-message
init_round_2
init_round_5
int
inverse_chat_templates
jeffboudier-transformers-docs-ad-copy
jnp_devicearray
keras-core-support
keras3_compatibility_phase_2
keras_3_compatibility
larger_runner
less-constraints
link-to-the-hub
llama-break-fix
llama-pad-side
llama-refactor
load_pretrainedfast_auto
make-cache-traceable
mark_whisper_test_slow
master
measure_all_tests
measure_gen
measure_gen_on_0ae789e0
measure_gen_on_75bbfd5b
measure_gen_on_b6eb708b
merge_text2text_into_text_generation
ministral
mitigate_tf_stride_vulnerability
modular-roberta
modular-stablelm
more_reduced_dummy_memory_usage
more_tf_int_dtypes
moshi-integration
move_jobs_from_daily_ci_channel
move_part_2
muellerzr-accum-plugin
muellerzr-ds-investigation
muellerzr-dummy-pr
muellerzr-enable-quant
muellerzr-enable-torchdata
muellerzr-fix-autocast
muellerzr-fix-integration-tests
muellerzr-fix-reentrant
muellerzr-fix-timeout
muellerzr-free-memory
muellerzr-free-memory-passthrough
muellerzr-jobs
muellerzr-less-fixes
muellerzr-lr-sched-right-version
muellerzr-metrics
muellerzr-modeling
muellerzr-more-ga-tests-fast
muellerzr-more-models-sadface
muellerzr-multinode-save
muellerzr-network-retry
muellerzr-skip-dvc
muellerzr-skip-failing-example
muellerzr-speedup-modular-conversion
muellerzr-trainer-refactor
muellerzr-transformers-should-not-set-env-variables
muellerzr-use-scientific
mymain
new-split
nezha_slow
nit-ga-condition
nit-modular-reame
nit-refactor
nit-remove-irrelevant-comment
nit_cleanup
nits-attention
no_more_shape_list
no_overwrite_test_batching_equivalence
noua/bloom_cugraph
np2
on_predict
onnx_gpt2_io_definition
output_ragged
pin-ffspec
pin-gguf
pin_ds
ping_author
ping_author_6
pipeline-revision-mirror
pipelines_signatures
pixtral_batchmixfeature_fix
pixtral_processor_structure_fix
post-action-build-test-tokenizers-main
processor-template-duplicated-tokens
protobuf-4
push-ci-image
quickfix_generate_tests
reenable_test
refactor-attention-converesion
refactor-from-pretrained
refactor_doctest_2
refactoring-new-version
relative-paths
remove-cache-migration-script
remove-items
remove-torch-pre-releases-amd-image
remove-warnings
repro-bug-pytorch-compile
repro-bug-pytorch-compile-cudagraph
reset_logger_level_2
resnet_with_variants
reverse_templating
revert-17547-update-support-image
revert-17646-skip_repo_not_found
revert-31494-add_dac
revert-33934-patch-1
revert-checkpoint-tmp-dir
revert-commit-30302
revert_hard_error2
robust_config_ckpt_check
run-amd
run-fix-Parameter-init
run-move-integrations
run_add_tts_pip
run_amd_push_ci_caller
run_amd_scheduled_ci_caller
run_amd_scheduled_ci_caller_testing
run_amd_scheduled_ci_caller_testing1
run_better_job_artifact_name
run_better_report
run_bon_courage
run_check_auto_mapping_importable
run_check_natten
run_ci_manually
run_daily_ci
run_daily_ci_11_20
run_daily_ci_11_21
run_deepspeed_ci
run_doctest_after_merge
run_doctest_ci
run_ds_ci
run_fc639143
run_fc639143_001
run_fc639143_002
run_fc639143_003
run_feat/kv_cache_class
run_fix_doc_on_circleci
run_fix_error_not_captured
run_nightly_ci_test_new_runner
run_no_job_name
run_past_ci_2nd
run_refactor_doctest
run_run_all_tests
run_run_amd_scheduled_ci_caller_deepspeed_test
run_scheduled_ci_now
run_scheduled_ci_now_2
run_scheduled_ci_now_3
run_scheduled_ci_now_4
run_scheduled_ci_now_5
run_scheduled_ci_now_6
run_sep_model_and_other_no_model_n_8_all_models
run_show_failure_better
run_split_daily_ci_based_on_no_job_name
run_split_daily_ci_based_on_no_job_name_2
run_tiny_with_fix_tiny_model_creation
run_torch_v_2_1
run_trigger_ci_when_tiny_summary_modified
run_truncate
run_update_tiny_002
run_use_main_in_conversion_script
safe_ci_report
safe_serialization_always_valid
safetensors-0.4.2
safetensors-step-2-2
safetensors_pre_release
safetensors_rc
scale
secure-amd-ci
shieh-length_in_compile
show_failure
simplify
simplify-contributions-init
simplify-contributions-inits
simplify-contributions-main-init
simplify-contributions-model_init
skip-tokenizer-test
skip_2_hub_tests
skip_blip2_torchscript
skip_idefics_doctest
sliding-window
smangrul/fix-auto-batch-finder-trainer-issue
smangrul/integrate-accelerate
smangrul/starcoder-int4-ddp-flash-attn
split_daily_ci
spmconverter_user_symbols
ssh_new_cluster
starcoder-2-fix
stas00-patch-1
state_spaces_call_for_contribution
stop-ci-on-fail-doc
stop-throwing-cache-warning
support-copy
sync-table-question-answering
sync_dqa_pipeline
sync_token_classification_and_zero_shot
sync_vqa_pipeline
t5-fp16-no-nans
temp-disable-scheduled-amd-ci
temp-kosmos25
temporary_pin_torch_2
tensor-cache
test-bin-format
test-build-ci-uv
test-datasets-2.14
test-datasets-2.21
test-datasets-3.0
test-datasets-main
test-datasets-pr
test-deepseek-fp8
test-doctests
test-eetq-dockerfile
test-fa2
test-huggingface_hub-pre-release
test-new-doc-builder-workflow
test-seentok
test-tokenizer-release
test-tokenizers-main
test_bc_tokenizers
test_ci
test_composition_2
test_composition_lysandre
test_composition_remote_tool
test_doc
test_docker_run_quantization
test_if_token
test_release_candidates
test_run_scheduler_ci
test_safetensors
test_safetensors_0.5.0
test_safetensors_abi3
test_tokenizers_0.19.0rc0
test_tokenizers_abi3
tf_forced_logits_xla_compatible
tf_int64_tests
tf_llama_port
tf_new_dummy_building
tf_quicktour_fix
tfconvnext
thomas/accelerate_gpt2
thomas/accelerate_gptj
thomas/add_custom_kernels
thomas/bloom_allow_fp32_lm_head
thomas/dirty_bloom_tp
thomas/fix_bloom
thomas/improve_bloom_generation_speed
thomas/llama
thomas/make_tp_bloom_generate_work
thomas/make_tp_work_with_bloom
tied_weights_load
tied_weights_warning_check
timm_wrapper_kwargs
tok-update
tokenizer-release
tokenizers_rc1
tools-inference-endpoints
torch-2.2-on-daily-ci
torch_versions
tp-loading
tp-support
trad_fixes
trainer-hyperparameter-search-kwargs-docs-update
trigger-amd-image-build
trigger_ci_with_torch_2_4
trigger_daily_ci
trigger_debug
trigger_disable_multi_gpu
trigger_doc
trigger_pt_10_past_ci
trigger_run_amd_scheduled_ci_caller_deepspeed_test
trigger_slow
trigger_test_cached_model_has_minimum_calls_to_head
trigger_upload_artifacts_3
try_comment_bot
try_fix_whisper_slow_test
try_matrix_fail
try_new_natten
try_new_natten_2
try_pydantic_v2_build_images
try_run_amd_push_ci_caller
try_sub
update-add-new-model
update-cooki
update-doc-gpu
update-from-pretrained
update-quantization-docker
update-special-tokens
update-tokenizers-version
update_27265
update_kosmos_2_file
update_llama_template
update_ssh
upgrade_tokenizers2
use-hfh-loading-saving-state-dict-helpers
use-process-retry-on-amd-smi
use-safetensors-from-pr
use-uv-
use_pt_25_image
v3.5.1hotfix
v4.0.0-release
v4.0.1-release
v4.10.0
v4.10.0-release
v4.10.1-release
v4.10.2-release
v4.10.3-release
v4.12.1-release
v4.12.2-release
v4.12.3-release
v4.12.4-release
v4.12.5-release
v4.14.1-release
v4.16.1-release
v4.16.2-release
v4.17.0-release
v4.18-release
v4.19-release
v4.2.1-patch
v4.2.2-patch
v4.20-release
v4.21-release
v4.22-release
v4.23-release
v4.24-release
v4.25-release
v4.26-release
v4.27-release
v4.28-release
v4.29-release
v4.3.0-release
v4.3.1-release
v4.3.2-release
v4.3.3-release
v4.30-release
v4.31-release
v4.32-release
v4.33-release
v4.34-release
v4.35-release
v4.36-release
v4.37-release
v4.38-release
v4.39-release
v4.4.2-release
v4.40-release
v4.41-release
v4.42-release
v4.43-release
v4.44-release
v4.45-release
v4.46-release
v4.47-release
v4.48-release
v4.5.0-release
v4.5.1-release
v4.6.0-release
v4.8.0-release
v4.8.2-release
v4.9.1
v4.9.2-release
warn-pre-allocation
whisper_chunking
whisper_out_of_range
wip_test_safetensors_rc
xenova-patch-1
xla_concrete_fn_dynamic_shape_debug
ydshieh-push-ci-image
ydshieh_check_run_nightly_ci_test_new_runner
yih-dar-try-compile_models
younes-opt-350-m
younes-test-workflow
younesbelkada-patch-1
zach-accelerate-integration
0.1.2
0.5.0
1.0
1.1.0
1.2.0
3.0.1
4.3.0.rc1
list
localattn1
v0.1.2
v0.2.0
v0.3.0
v0.4.0
v0.5.0
v0.5.1
v0.6.0
v0.6.1
v0.6.2
v1.0.0
v2.0.0
v2.1.0
v2.1.1
v2.10.0
v2.11.0
v2.2.0
v2.2.1
v2.2.2
v2.3.0
v2.4.0
v2.4.1
v2.5.0
v2.5.1
v2.6.0
v2.7.0
v2.8.0
v2.9.0
v2.9.1
v3.0.0
v3.0.1
v3.0.2
v3.1.0
v3.2.0
v3.3.0
v3.3.1
v3.4.0
v3.5.0
v3.5.1
v4.0.0
v4.0.0-rc-1
v4.0.1
v4.1.0
v4.1.1
v4.10.0
v4.10.1
v4.10.2
v4.10.3
v4.11.0
v4.11.1
v4.11.2
v4.11.3
v4.12.0
v4.12.1
v4.12.2
v4.12.3
v4.12.4
v4.12.5
v4.13.0
v4.14.0
v4.14.1
v4.15.0
v4.16.0
v4.16.1
v4.16.2
v4.17.0
v4.18.0
v4.19.0
v4.19.1
v4.19.2
v4.19.3
v4.19.4
v4.2.0
v4.2.1
v4.2.2
v4.20.0
v4.20.1
v4.21.0
v4.21.1
v4.21.2
v4.21.3
v4.22.0
v4.22.1
v4.22.2
v4.23.0
v4.23.1
v4.24.0
v4.25.1
v4.26.0
v4.26.1
v4.27.0
v4.27.1
v4.27.2
v4.27.3
v4.27.4
v4.28.0
v4.28.1
v4.29.0
v4.29.1
v4.29.2
v4.3.0
v4.3.0.rc1
v4.3.1
v4.3.2
v4.3.3
v4.30.0
v4.30.1
v4.30.2
v4.31.0
v4.32.0
v4.32.1
v4.33.0
v4.33.1
v4.33.2
v4.33.3
v4.34.0
v4.34.1
v4.35.0
v4.35.1
v4.35.2
v4.36.0
v4.36.1
v4.36.2
v4.37.0
v4.37.1
v4.37.2
v4.38.0
v4.38.1
v4.38.2
v4.39.0
v4.39.1
v4.39.2
v4.39.3
v4.4.0
v4.4.1
v4.4.2
v4.40.0
v4.40.1
v4.40.2
v4.41.0
v4.41.1
v4.41.2
v4.42.0
v4.42.1
v4.42.2
v4.42.3
v4.42.4
v4.43.0
v4.43.1
v4.43.2
v4.43.3
v4.43.4
v4.44.0
v4.44.1
v4.44.2
v4.45.0
v4.45.1
v4.45.2
v4.46.0
v4.46.1
v4.46.2
v4.46.3
v4.47.0
v4.47.1
v4.48.0
v4.48.1
v4.48.2
v4.48.3
v4.5.0
v4.5.1
v4.6.0
v4.6.1
v4.7.0
v4.8.0
v4.8.1
v4.8.2
v4.9.0
v4.9.1
v4.9.2
-
d6f446ffa7
when filtering we can't use the convert script as we removed them
Arthur Zucker
2025-01-10 11:29:31 +0100 -
8ce1e9578a
[test-all]
Arthur Zucker
2025-01-10 11:20:41 +0100 -
af2d7caff3
Add Moonshine (#34784)
eustlb
2025-01-10 11:00:54 +0100 -
42b8e7916b
ModernBert: reuse GemmaRotaryEmbedding via modular + Integration tests (#35459)
Tom Aarsen
2025-01-10 10:25:10 +0100 -
e39c9f7a78
v4.48-release
Arthur Zucker
2025-01-10 10:12:04 +0100 -
26c76151d2
fix
no_overwrite_test_batching_equivalence
ydshieh
2025-01-09 14:07:59 +0100 -
c982243b40more robust fix-device-map
Cyril Vallez
2025-01-09 14:06:07 +0100 -
7deee60a04style
Cyril Vallez
2025-01-09 13:52:00 +0100 -
196cf39446style
Cyril Vallez
2025-01-09 13:47:24 +0100 -
b902568a1dUpdate modeling_utils.py
Cyril Vallez
2025-01-09 13:42:06 +0100 -
7599f0d156default device for rotary
Cyril Vallez
2025-01-09 13:40:38 +0100 -
7a97d86140Merge branch 'main' into secure-amd-ci
ivarflakstad
2025-01-06 11:16:32 +0100 -
0f5f322c16Disable self-scheduled-amd-caller.yml temp-disable-scheduled-amd-ci
ivarflakstad
2025-01-06 11:10:34 +0100 -
90f2781aaf
Modular files
init_round_5
Lysandre
2025-01-05 18:33:42 +0100 -
e0d87fd988Testing safetensors 0.5.0rc0 test_safetensors_0.5.0
Nicolas Patry
2025-01-02 16:40:43 +0100 -
f6d0607530
run_ci
fix_docker_autoawq
MekkCyber
2024-12-25 13:09:45 +0000 -
f6e0a11b18
fix
MekkCyber
2024-12-25 11:31:32 +0000 -
20876c7156
fix_docker
MekkCyber
2024-12-25 10:42:37 +0000 -
b2d0e283e9
Add option of specifying result upload repo
Ivar Flakstad
2024-12-20 18:24:33 +0100 -
d9ffefad5eFix syntax in HfQuantizer docstring albertvillanova-patch-1
Albert Villanova del Moral
2024-12-19 10:58:06 +0100 -
b6381e3c9dMerge branch 'main' into whisper_out_of_range whisper_out_of_range
eustlb
2024-12-18 16:54:15 +0100 -
b56e46dbe8
fixing test
fix_falcon_processor
MekkCyber
2024-12-18 09:46:06 +0000 -
7c99fd066f
temp
temp-kosmos25
ydshieh
2024-12-17 18:17:35 +0100 -
a65a9b11d3
temp
ydshieh
2024-12-17 17:49:49 +0100 -
30f927a54a
temp
ydshieh
2024-12-17 17:38:31 +0100 -
a3638eab9d
temp
ydshieh
2024-12-17 17:25:54 +0100 -
876cb6b217
temp
ydshieh
2024-12-17 16:36:00 +0100 -
ce222a6990
temp
ydshieh
2024-12-17 16:33:05 +0100 -
9b29aacce3
temp
ydshieh
2024-12-17 16:18:37 +0100 -
bf14c4b95a
temp
ydshieh
2024-12-17 16:14:37 +0100 -
db865dbeda
temp
ydshieh
2024-12-17 16:12:47 +0100 -
7f0d26c55e
temp
ydshieh
2024-12-17 16:06:31 +0100 -
0ec499a841
temp
ydshieh
2024-12-17 15:55:43 +0100 -
5f731a9aa9
temp
ydshieh
2024-12-17 15:45:43 +0100 -
6b2f7d79e2
temp
ydshieh
2024-12-17 15:28:45 +0100 -
2d4cbba164
temp
ydshieh
2024-12-17 15:26:01 +0100 -
83d600e5f8
temp
ydshieh
2024-12-17 15:22:53 +0100 -
55944fcf87
temp
ydshieh
2024-12-17 15:19:54 +0100 -
c356a36327
temp
ydshieh
2024-12-17 15:14:47 +0100 -
b2c3db2990
temp
ydshieh
2024-12-17 14:51:26 +0100 -
39dc6ef257
temp
ydshieh
2024-12-17 14:47:48 +0100 -
9ddc86b560
temp
ydshieh
2024-12-17 13:30:32 +0100 -
d5b834925c
temp
ydshieh
2024-12-17 13:23:06 +0100 -
3a58742f92
temp
ydshieh
2024-12-17 12:52:54 +0100 -
d1c52f4ffc
temp
ydshieh
2024-12-17 12:38:01 +0100 -
241c04d368
[Whisper] patch float type on mps (#35295)
v4.47.1
v4.47-release
eustlb
2024-12-16 16:52:47 +0100 -
b688c4f564
Merge branch 'ca03842c' into kosmos25
ydshieh
2024-12-16 17:02:08 +0100 -
c639eeb73e
it's Monday let's go
ydshieh
2024-12-16 17:00:01 +0100 -
8a058d9d56
it's Monday let's go
ydshieh
2024-12-16 16:35:17 +0100 -
395a6365b0
it's Monday let's go
ydshieh
2024-12-16 16:23:18 +0100 -
76a9fdcbc5
Revert amd push ci changes
Ivar Flakstad
2024-12-16 13:54:53 +0100 -
c632572874
Merge branch 'main' into secure-amd-ci
Ivar Flakstad
2024-12-16 13:52:10 +0100 -
a1ad329833
Test hfh v0.27.0.rc1
ci-test-huggingface-hub-v0.27.0.rc1
Celina Hanouti
2024-12-16 12:36:48 +0100 -
0e762a020f
trigger ci
use-hfh-loading-saving-state-dict-helpers
Celina Hanouti
2024-12-16 11:38:28 +0100 -
e130c8bbee
run tests while keeping generate_kwargs
Celina Hanouti
2024-12-16 11:27:45 +0100 -
2c47915424
it's Friday night, let cross finger
ydshieh
2024-12-13 19:39:05 +0100 -
1b6cb1eefc
don't use no_sync when deepspeed doesn't support it for certain zero stages (#35157)
Wing Lian
2024-12-13 13:23:00 -0500 -
b1d5d6dd65
Fix FSDP no longer working (#35212)
Zach Mueller
2024-12-13 13:20:51 -0500 -
9c8aff7cf9
it's Friday night, let cross finger
ydshieh
2024-12-13 19:06:30 +0100 -
00e324db90
it's Friday night, let cross finger
ydshieh
2024-12-13 18:35:53 +0100 -
90c4fcc29c
it's Friday night, let cross finger
ydshieh
2024-12-13 18:29:22 +0100 -
ce3a6b0ab7
it's Friday night, let cross finger
ydshieh
2024-12-13 18:28:20 +0100 -
fbb3e592af
it's Friday night, let cross finger
ydshieh
2024-12-13 18:20:21 +0100 -
f8c98d6173
it's Friday night, let cross finger
ydshieh
2024-12-13 17:58:05 +0100 -
ad0f08e02b
Test hfh v0.27.0.rc0
ci-test-huggingface-hub-v0.27.0.rc0
Celina Hanouti
2024-12-13 17:32:06 +0100 -
b1db4f22b6
fix
ydshieh
2024-12-13 16:56:06 +0100 -
85da449436
fix
ydshieh
2024-12-13 16:37:28 +0100 -
e3802f4baa
fix
ydshieh
2024-12-13 15:56:08 +0100 -
91fa38341a
fix
ydshieh
2024-12-13 15:35:00 +0100 -
bd47e63fbf
ignore formatter
fix-Seq2SeqTrainingArguments-doc
Quentin Gallouédec
2024-12-13 14:30:27 +0000 -
dcced48507
fix
ydshieh
2024-12-13 15:09:42 +0100 -
5060a334de
remove layer_idx
llama-refactor
Cyril Vallez
2024-12-13 14:07:01 +0000 -
a1cc7ebbb6
try fix Seq2SeqTrainingArguments
Quentin Gallouédec
2024-12-13 13:37:42 +0000 -
31978f94e4
add docstring
Celina Hanouti
2024-12-13 13:34:07 +0100 -
61ab4e2849
fix tests
Celina Hanouti
2024-12-13 13:29:13 +0100 -
356c1bc85a
Use rocm 6.3 as base amd image and add nvidia-ml-py to exclude list
build_ci_docker_image_amd1
Ivar Flakstad
2024-12-13 12:28:34 +0100 -
7394401d24
add hfh loading state dict helpers
Celina Hanouti
2024-12-13 11:43:16 +0100 -
caaa5e5508
tgi update
Cyril Vallez
2024-12-12 18:29:26 +0000 -
95cb944ee6
be permissive
Arthur Zucker
2024-12-12 11:33:37 +0100 -
584b443096
fix unpack imoprt
Arthur Zucker
2024-12-12 10:43:13 +0100 -
57eece66af
Merge branch 'llama-refactor' of github.com:huggingface/transformers into llama-refactor
Arthur Zucker
2024-12-12 10:36:54 +0100 -
9461039d87
nits
Arthur Zucker
2024-12-12 10:36:49 +0100 -
f7395cc0ccMerge branch 'main' into llama-refactor
Arthur
2024-12-12 14:57:58 +0530 -
4f36712da1
nit?
Arthur Zucker
2024-12-12 10:24:11 +0100 -
2016bc47d0
default init weights
Arthur Zucker
2024-12-12 10:18:38 +0100 -
53450ac365
fix
Arthur Zucker
2024-12-12 10:14:20 +0100 -
1a5a834f53
fix auto?
Arthur Zucker
2024-12-12 09:53:53 +0100 -
3f68c7cf72
9 left!
Arthur Zucker
2024-12-12 09:44:14 +0100 -
c224f36d10
fix some tests
Arthur Zucker
2024-12-12 09:39:36 +0100 -
725d00caf4
fix some stuff
Arthur Zucker
2024-12-12 09:22:04 +0100 -
6028e85990
fixup
Arthur Zucker
2024-12-11 19:50:04 +0100 -
7a608da9f8
update
Arthur Zucker
2024-12-11 19:44:29 +0100 -
e9d751abaa
fix attention_mask
Arthur Zucker
2024-12-11 19:26:39 +0100 -
60189825d7
fix!
Arthur Zucker
2024-12-11 19:09:09 +0100 -
d9156363bf
mm
Arthur Zucker
2024-12-11 18:49:37 +0100 -
20c512bc80
clean
Arthur Zucker
2024-12-11 18:07:53 +0100 -
d786f26a00
Empty commit
muellerzr-network-retry
[[ -z $EMAIL ]] && read -e -p "Enter your email (for git configuration): " EMAIL
2024-12-11 12:00:27 -0500 -
2df4b507e7
Empty commit
[[ -z $EMAIL ]] && read -e -p "Enter your email (for git configuration): " EMAIL
2024-12-11 12:00:25 -0500 -
8381165040
Merge remote-tracking branch 'origin/main' into dduf-compability
dduf-compability
Marc Sun
2024-12-11 17:00:22 +0000 -
40f1845c2e
New approach
[[ -z $EMAIL ]] && read -e -p "Enter your email (for git configuration): " EMAIL
2024-12-11 11:48:02 -0500