mirror of
https://github.com/saymrwulf/transformers.git
synced 2026-05-14 20:58:08 +00:00
Commit graph
Select branches
Hide pull requests
'delete-delete-doc'
29625_add_prefix_space
29625_prefix_space
30824-spmconverter-user-defined-symbol
31187_depreciate_clean_up_tokenization_spaced
BritneyMuller-housekeeping-patch
LysandreJik-patch-1
_dummy_fix_weight_only_usage
_dummy_fix_weight_only_usage_2
add-deci-lm
add-flash-decoding
add-fp8-llama-script
add-git-lfs-to-amd-image
add-qgalore
add-rwkv5
add-warning-4bit-opti
add_amd_daily_ci
add_back_generative_class
add_deformable_detr
add_fa2_bart
add_important_warning_padding_attention_mask
add_kosmos_2_remote
add_kosmos_2_temp
add_kosmos_2_utm5_attn
add_kosmos_2_utm5_attn_rebased
add_kosmos_2_utm5_attn_rebased_flat_layer_structure
add_num_workers_for_tf
add_pipeline_equivalence_testing
add_prefix_space_29625
add_prefix_space_clean
add_siglip_fast_tokenizer_bis
add_tf_export_doc
add_word_level_timestamp_long
adding_fp8_quantization
agent_callback
agents-count-tokens
agents-make-easier-tags
agents-messages
albertvillanova-patch-1
allow_old_falcon_name
amd-nightly-ci
amdgpu-multi-gpu-tests
another_prepare_dataset_fix
api_big2
arijitx/wav2vec2_alignment
assistant_decoding_batch
attn-implementation-vision-enc-dec
auot-convert-tekken
auto-assign-reviewers
auto_gpt4_conversion
autoformer-test-seq-to-seq-add-atol
best_benchmark
best_benchmark_new
best_benchmark_on_static_cache
best_benchmark_on_static_cache_new
bloom_big
bos_eos_token_fix
bos_eos_token_slow
build-check-deepspeed-image
build-docker-torch-2.2
build_ci_docker_image_amd1
build_ci_docker_image_amd2
build_ci_docker_image_amd3
build_docker_on_kube
build_docker_on_kube_2
build_docker_on_kube_3
build_image_abc
byebye
byebye_py_37
cache_exp
change-ci
chat_template_kwargs
check-deepspeed
check-send-headers-when-converting-safetensors
check-whisper-slow-tests
check_amd_image_build
check_compile
check_compile_if_flaky
check_doc_test
check_docker_i
check_ds
check_example_ci
check_example_job
check_fastspeech
check_fix_fix_fix
check_fix_torch_pip
check_flaky
check_flax_example
check_gated_repo
check_gemma
check_gemma_compile
check_gemma_compile_2
check_gen_2
check_layoutlm
check_layoutlmv2
check_limit
check_mem
check_mem_00c1d87
check_mem_3cefac1d
check_mem_56b64bf
check_mem_838b87a
check_nightly_build
check_nightly_build_build_image
check_nougat
check_past_runner
check_permission
check_quant
check_quantized_param_bnb4
check_report
check_safetensors_rc
check_slow_pr
check_speed_no_empty
check_strange_doctest
check_tiny_creation
check_torch_2.2
check_trigger_4d8427f7
check_trigger_a81cf9ee
check_update_cache_number
check_ved_trocr
check_what_wrong_in_tiny_creation
checkout-layoutlm-tokenizers
chunk_length_ctc
ci-amdgpu-build-docker-images
ci-amdgpu-mi250
ci-amdgpu-nightly
ci-test-huggingface-hub-v0.15.0.rc0
ci-test-huggingface-hub-v0.16.0.rc0
ci-test-huggingface-hub-v0.17.0.rc0
ci-test-huggingface-hub-v0.18.0.rc0
ci-test-huggingface-hub-v0.19.0.rc0
ci-test-huggingface-hub-v0.20.0.rc1
ci-test-huggingface-hub-v0.21.0.rc0
ci-test-huggingface-hub-v0.22.0.rc0
ci-test-huggingface-hub-v0.23.0.rc0
ci-test-huggingface-hub-v0.23.0.rc1
ci-test-huggingface-hub-v0.24.0.rc0
ci-test-huggingface-hub-v0.25.0.rc0
ci-test-huggingface-hub-v0.25.0.rc1
ci-test-huggingface-hub-v0.26.0.rc0
ci-test-huggingface-hub-v0.27.0.rc0
ci-test-huggingface-hub-v0.27.0.rc1
ci-test-huggingface-hub-v0.27.0rc1
ci-test-huggingface-hub-v0.28.0.rc0
ci-test-huggingface-hub-v0.28.0.rc5
circleci_combine_reports
circleci_debug_base
circleci_debug_base_MobileNetV1ModelTest_test_batching_equivalence
circleci_debug_base_timm
circleci_debug_base_timm_3
clean_spmcoverter
cohere-diff
cohere-diff-2
compare_ci_with_torch_2.2
compile-rope
continuous-batching
custom_bloom_kernel
databricks
dduf-compability
dduf-compatibility-with-file-explorer
deberta-xla-fixes
debug_bloom
debug_get_jobs
debug_kosmos_2_output
debug_mem_0b192de1
debug_mem_95b37495
debug_metadata_run
debugdebug
debugdebug-2
debugdebug-5
deepseek_v2_support
deepspeed-amd-pytorch-version-fix
default-auto
default-fast-load
delete_big_tokenizer_block
deprecate_LegacyIndex
disable_multi_gpu
doc-builder
doc-link-one-or-two-papers-lysandre
doc-regactor
doc_builder_rename
doc_pr
docker_change_awq_version
docs-ctrl-lys
dont-use-deprecated-method
drop_py38_build_img_2
ds-fix-resume
ds-ignore_mismatched_sizes
dynamic_length_in_static_cache
dynamic_length_in_static_cache_001
dynamic_length_in_static_cache_002
dynamic_length_in_static_cache_reconstruct_tensors_from_length
dynamic_length_on_0ae789e0
dynamic_length_on_75bbfd5b
dynamic_length_on_95b3c381
dynamic_length_on_b6eb708b
enable_tf_numpy
faster_cache_without_compile
faster_copies
faster_set_initialized_submodules
fire
fix-Parameter-init
fix-Seq2SeqTrainingArguments-doc
fix-autoprocessor-import-order
fix-bnb-warning
fix-ci
fix-ci-setup
fix-copies
fix-device-map
fix-doc-builder-edit
fix-flash-comment
fix-from-pretrained
fix-gemma2-sdpa
fix-gemma2-sliding-window
fix-gpt2-scaled-init
fix-int8-serilation
fix-kwargs-issues
fix-llama-3-gguf
fix-pipeline-predict-transform-methods
fix-pixtral-tests
fix-pytorch-deepspeed-image
fix-quality-2
fix-red-ci-atol
fix-slow-tests-shieh-trigger
fix-task-mappings
fix-word-ids
fix-workflow
fix_TFMarianModelTest_test_xla_generate_slow
fix_aria_ci
fix_auto_test
fix_autoawq_docker
fix_autoawq_test
fix_bamba_test
fix_check_copies
fix_chinese_clip
fix_convert_spm_bpe
fix_deprecation_warnings
fix_dinat_2
fix_dinov2
fix_docker_autoawq
fix_docker_autogptq_from_source
fix_doctest
fix_doctest_based_on_refactor_doctest_2
fix_eetq_test
fix_falcon_processor
fix_flaky_4
fix_flaky_test_assisted_decoding_matches_greedy_search
fix_flaky_test_pt_tf_model_equivalence
fix_fp_32
fix_generate_embeds
fix_gptq_test
fix_gptq_tests
fix_jetmoe
fix_more_input_out
fix_not_init
fix_peft_model_in_pipelines
fix_pipe_tests_001
fix_quanto_llama27b
fix_remote_tool
fix_slow_gen_on_0ae789e0
fix_slow_gen_on_75bbfd5b
fix_slow_gen_on_b6eb708b
fix_st5_docs
fix_stupid_cond
fix_test_encode_decode
fix_test_fetcher_tests
fix_tie
fix_whisper_ci
fix_whisper_tflite_export
fix_zh_quicktour_md
flex_attention_qwen2
flex_attn_example
for_test_run_squad_no_trainer
force-convert
full-bf16-train
full_length_on_468f7cca
full_length_on_68b71c85
full_length_on_862cde4c
gemma_allow_compile
general_test_low_cpu_mem
get_bad_commits_for_daily_ci_11_20
get_bad_commits_for_daily_ci_11_26
gpt-flex-attention
gpt-mqa
gptneo_gpt4_port
gptneo_gpt4_port_new
hardware-auto-setup
hardware-auto-setup-ci
hotfix_ci_222
hqq_serialization
idefics3
ifix_aqlm_modules_to_not_convert
improve_error_message_asr_pipeline
improve_error_message_when_transformers_is_misconfigured
improve_torch_version_check
informative-detr-message
init_round_2
init_round_5
int
inverse_chat_templates
jeffboudier-transformers-docs-ad-copy
jnp_devicearray
keras-core-support
keras3_compatibility_phase_2
keras_3_compatibility
larger_runner
less-constraints
link-to-the-hub
llama-break-fix
llama-pad-side
llama-refactor
load_pretrainedfast_auto
make-cache-traceable
mark_whisper_test_slow
master
measure_all_tests
measure_gen
measure_gen_on_0ae789e0
measure_gen_on_75bbfd5b
measure_gen_on_b6eb708b
merge_text2text_into_text_generation
ministral
mitigate_tf_stride_vulnerability
modular-roberta
modular-stablelm
more_reduced_dummy_memory_usage
more_tf_int_dtypes
moshi-integration
move_jobs_from_daily_ci_channel
move_part_2
muellerzr-accum-plugin
muellerzr-ds-investigation
muellerzr-dummy-pr
muellerzr-enable-quant
muellerzr-enable-torchdata
muellerzr-fix-autocast
muellerzr-fix-integration-tests
muellerzr-fix-reentrant
muellerzr-fix-timeout
muellerzr-free-memory
muellerzr-free-memory-passthrough
muellerzr-jobs
muellerzr-less-fixes
muellerzr-lr-sched-right-version
muellerzr-metrics
muellerzr-modeling
muellerzr-more-ga-tests-fast
muellerzr-more-models-sadface
muellerzr-multinode-save
muellerzr-network-retry
muellerzr-skip-dvc
muellerzr-skip-failing-example
muellerzr-speedup-modular-conversion
muellerzr-trainer-refactor
muellerzr-transformers-should-not-set-env-variables
muellerzr-use-scientific
mymain
new-split
nezha_slow
nit-ga-condition
nit-modular-reame
nit-refactor
nit-remove-irrelevant-comment
nit_cleanup
nits-attention
no_more_shape_list
no_overwrite_test_batching_equivalence
noua/bloom_cugraph
np2
on_predict
onnx_gpt2_io_definition
output_ragged
pin-ffspec
pin-gguf
pin_ds
ping_author
ping_author_6
pipeline-revision-mirror
pipelines_signatures
pixtral_batchmixfeature_fix
pixtral_processor_structure_fix
post-action-build-test-tokenizers-main
processor-template-duplicated-tokens
protobuf-4
push-ci-image
quickfix_generate_tests
reenable_test
refactor-attention-converesion
refactor-from-pretrained
refactor_doctest_2
refactoring-new-version
relative-paths
remove-cache-migration-script
remove-items
remove-torch-pre-releases-amd-image
remove-warnings
repro-bug-pytorch-compile
repro-bug-pytorch-compile-cudagraph
reset_logger_level_2
resnet_with_variants
reverse_templating
revert-17547-update-support-image
revert-17646-skip_repo_not_found
revert-31494-add_dac
revert-33934-patch-1
revert-checkpoint-tmp-dir
revert-commit-30302
revert_hard_error2
robust_config_ckpt_check
run-amd
run-fix-Parameter-init
run-move-integrations
run_add_tts_pip
run_amd_push_ci_caller
run_amd_scheduled_ci_caller
run_amd_scheduled_ci_caller_testing
run_amd_scheduled_ci_caller_testing1
run_better_job_artifact_name
run_better_report
run_bon_courage
run_check_auto_mapping_importable
run_check_natten
run_ci_manually
run_daily_ci
run_daily_ci_11_20
run_daily_ci_11_21
run_deepspeed_ci
run_doctest_after_merge
run_doctest_ci
run_ds_ci
run_fc639143
run_fc639143_001
run_fc639143_002
run_fc639143_003
run_feat/kv_cache_class
run_fix_doc_on_circleci
run_fix_error_not_captured
run_nightly_ci_test_new_runner
run_no_job_name
run_past_ci_2nd
run_refactor_doctest
run_run_all_tests
run_run_amd_scheduled_ci_caller_deepspeed_test
run_scheduled_ci_now
run_scheduled_ci_now_2
run_scheduled_ci_now_3
run_scheduled_ci_now_4
run_scheduled_ci_now_5
run_scheduled_ci_now_6
run_sep_model_and_other_no_model_n_8_all_models
run_show_failure_better
run_split_daily_ci_based_on_no_job_name
run_split_daily_ci_based_on_no_job_name_2
run_tiny_with_fix_tiny_model_creation
run_torch_v_2_1
run_trigger_ci_when_tiny_summary_modified
run_truncate
run_update_tiny_002
run_use_main_in_conversion_script
safe_ci_report
safe_serialization_always_valid
safetensors-0.4.2
safetensors-step-2-2
safetensors_pre_release
safetensors_rc
scale
secure-amd-ci
shieh-length_in_compile
show_failure
simplify
simplify-contributions-init
simplify-contributions-inits
simplify-contributions-main-init
simplify-contributions-model_init
skip-tokenizer-test
skip_2_hub_tests
skip_blip2_torchscript
skip_idefics_doctest
sliding-window
smangrul/fix-auto-batch-finder-trainer-issue
smangrul/integrate-accelerate
smangrul/starcoder-int4-ddp-flash-attn
split_daily_ci
spmconverter_user_symbols
ssh_new_cluster
starcoder-2-fix
stas00-patch-1
state_spaces_call_for_contribution
stop-ci-on-fail-doc
stop-throwing-cache-warning
support-copy
sync-table-question-answering
sync_dqa_pipeline
sync_token_classification_and_zero_shot
sync_vqa_pipeline
t5-fp16-no-nans
temp-disable-scheduled-amd-ci
temp-kosmos25
temporary_pin_torch_2
tensor-cache
test-bin-format
test-build-ci-uv
test-datasets-2.14
test-datasets-2.21
test-datasets-3.0
test-datasets-main
test-datasets-pr
test-deepseek-fp8
test-doctests
test-eetq-dockerfile
test-fa2
test-huggingface_hub-pre-release
test-new-doc-builder-workflow
test-seentok
test-tokenizer-release
test-tokenizers-main
test_bc_tokenizers
test_ci
test_composition_2
test_composition_lysandre
test_composition_remote_tool
test_doc
test_docker_run_quantization
test_if_token
test_release_candidates
test_run_scheduler_ci
test_safetensors
test_safetensors_0.5.0
test_safetensors_abi3
test_tokenizers_0.19.0rc0
test_tokenizers_abi3
tf_forced_logits_xla_compatible
tf_int64_tests
tf_llama_port
tf_new_dummy_building
tf_quicktour_fix
tfconvnext
thomas/accelerate_gpt2
thomas/accelerate_gptj
thomas/add_custom_kernels
thomas/bloom_allow_fp32_lm_head
thomas/dirty_bloom_tp
thomas/fix_bloom
thomas/improve_bloom_generation_speed
thomas/llama
thomas/make_tp_bloom_generate_work
thomas/make_tp_work_with_bloom
tied_weights_load
tied_weights_warning_check
timm_wrapper_kwargs
tok-update
tokenizer-release
tokenizers_rc1
tools-inference-endpoints
torch-2.2-on-daily-ci
torch_versions
tp-loading
tp-support
trad_fixes
trainer-hyperparameter-search-kwargs-docs-update
trigger-amd-image-build
trigger_ci_with_torch_2_4
trigger_daily_ci
trigger_debug
trigger_disable_multi_gpu
trigger_doc
trigger_pt_10_past_ci
trigger_run_amd_scheduled_ci_caller_deepspeed_test
trigger_slow
trigger_test_cached_model_has_minimum_calls_to_head
trigger_upload_artifacts_3
try_comment_bot
try_fix_whisper_slow_test
try_matrix_fail
try_new_natten
try_new_natten_2
try_pydantic_v2_build_images
try_run_amd_push_ci_caller
try_sub
update-add-new-model
update-cooki
update-doc-gpu
update-from-pretrained
update-quantization-docker
update-special-tokens
update-tokenizers-version
update_27265
update_kosmos_2_file
update_llama_template
update_ssh
upgrade_tokenizers2
use-hfh-loading-saving-state-dict-helpers
use-process-retry-on-amd-smi
use-safetensors-from-pr
use-uv-
use_pt_25_image
v3.5.1hotfix
v4.0.0-release
v4.0.1-release
v4.10.0
v4.10.0-release
v4.10.1-release
v4.10.2-release
v4.10.3-release
v4.12.1-release
v4.12.2-release
v4.12.3-release
v4.12.4-release
v4.12.5-release
v4.14.1-release
v4.16.1-release
v4.16.2-release
v4.17.0-release
v4.18-release
v4.19-release
v4.2.1-patch
v4.2.2-patch
v4.20-release
v4.21-release
v4.22-release
v4.23-release
v4.24-release
v4.25-release
v4.26-release
v4.27-release
v4.28-release
v4.29-release
v4.3.0-release
v4.3.1-release
v4.3.2-release
v4.3.3-release
v4.30-release
v4.31-release
v4.32-release
v4.33-release
v4.34-release
v4.35-release
v4.36-release
v4.37-release
v4.38-release
v4.39-release
v4.4.2-release
v4.40-release
v4.41-release
v4.42-release
v4.43-release
v4.44-release
v4.45-release
v4.46-release
v4.47-release
v4.48-release
v4.5.0-release
v4.5.1-release
v4.6.0-release
v4.8.0-release
v4.8.2-release
v4.9.1
v4.9.2-release
warn-pre-allocation
whisper_chunking
whisper_out_of_range
wip_test_safetensors_rc
xenova-patch-1
xla_concrete_fn_dynamic_shape_debug
ydshieh-push-ci-image
ydshieh_check_run_nightly_ci_test_new_runner
yih-dar-try-compile_models
younes-opt-350-m
younes-test-workflow
younesbelkada-patch-1
zach-accelerate-integration
0.1.2
0.5.0
1.0
1.1.0
1.2.0
3.0.1
4.3.0.rc1
list
localattn1
v0.1.2
v0.2.0
v0.3.0
v0.4.0
v0.5.0
v0.5.1
v0.6.0
v0.6.1
v0.6.2
v1.0.0
v2.0.0
v2.1.0
v2.1.1
v2.10.0
v2.11.0
v2.2.0
v2.2.1
v2.2.2
v2.3.0
v2.4.0
v2.4.1
v2.5.0
v2.5.1
v2.6.0
v2.7.0
v2.8.0
v2.9.0
v2.9.1
v3.0.0
v3.0.1
v3.0.2
v3.1.0
v3.2.0
v3.3.0
v3.3.1
v3.4.0
v3.5.0
v3.5.1
v4.0.0
v4.0.0-rc-1
v4.0.1
v4.1.0
v4.1.1
v4.10.0
v4.10.1
v4.10.2
v4.10.3
v4.11.0
v4.11.1
v4.11.2
v4.11.3
v4.12.0
v4.12.1
v4.12.2
v4.12.3
v4.12.4
v4.12.5
v4.13.0
v4.14.0
v4.14.1
v4.15.0
v4.16.0
v4.16.1
v4.16.2
v4.17.0
v4.18.0
v4.19.0
v4.19.1
v4.19.2
v4.19.3
v4.19.4
v4.2.0
v4.2.1
v4.2.2
v4.20.0
v4.20.1
v4.21.0
v4.21.1
v4.21.2
v4.21.3
v4.22.0
v4.22.1
v4.22.2
v4.23.0
v4.23.1
v4.24.0
v4.25.1
v4.26.0
v4.26.1
v4.27.0
v4.27.1
v4.27.2
v4.27.3
v4.27.4
v4.28.0
v4.28.1
v4.29.0
v4.29.1
v4.29.2
v4.3.0
v4.3.0.rc1
v4.3.1
v4.3.2
v4.3.3
v4.30.0
v4.30.1
v4.30.2
v4.31.0
v4.32.0
v4.32.1
v4.33.0
v4.33.1
v4.33.2
v4.33.3
v4.34.0
v4.34.1
v4.35.0
v4.35.1
v4.35.2
v4.36.0
v4.36.1
v4.36.2
v4.37.0
v4.37.1
v4.37.2
v4.38.0
v4.38.1
v4.38.2
v4.39.0
v4.39.1
v4.39.2
v4.39.3
v4.4.0
v4.4.1
v4.4.2
v4.40.0
v4.40.1
v4.40.2
v4.41.0
v4.41.1
v4.41.2
v4.42.0
v4.42.1
v4.42.2
v4.42.3
v4.42.4
v4.43.0
v4.43.1
v4.43.2
v4.43.3
v4.43.4
v4.44.0
v4.44.1
v4.44.2
v4.45.0
v4.45.1
v4.45.2
v4.46.0
v4.46.1
v4.46.2
v4.46.3
v4.47.0
v4.47.1
v4.48.0
v4.48.1
v4.48.2
v4.48.3
v4.5.0
v4.5.1
v4.6.0
v4.6.1
v4.7.0
v4.8.0
v4.8.1
v4.8.2
v4.9.0
v4.9.1
v4.9.2
-
7a911efddf
update
Arthur Zucker
2024-12-11 17:39:40 +0100 -
10e2fb75c1
Add retry torch decorator
[[ -z $EMAIL ]] && read -e -p "Enter your email (for git configuration): " EMAIL
2024-12-11 11:34:13 -0500 -
89d32d6825
fix auto set
Arthur Zucker
2024-12-11 17:30:26 +0100 -
3bbae39539
remove tanh
Arthur Zucker
2024-12-11 17:24:56 +0100 -
e5d60b4f23
fix
Arthur Zucker
2024-12-11 17:07:20 +0100 -
4b9a429a1c
style
Arthur Zucker
2024-12-11 16:54:35 +0100 -
1ef18f49a9
style
Arthur Zucker
2024-12-11 16:53:02 +0100 -
28829d2dd6
there was an issue with tie weight keys
Arthur Zucker
2024-12-11 16:44:04 +0100 -
40154815cb
revert some stuff
Arthur Zucker
2024-12-11 16:23:18 +0100 -
38dd294dd7
fix
Arthur Zucker
2024-12-11 16:10:40 +0100 -
1baabd3207
update
Arthur Zucker
2024-12-11 15:13:39 +0100 -
dcf7a37ce1
cache concatenates on the wrong axis
Arthur Zucker
2024-12-11 14:38:26 +0100 -
f61a5fec41
pass attention
Arthur Zucker
2024-12-11 14:37:12 +0100 -
556aa4ec2d
updates
Arthur Zucker
2024-12-11 14:35:53 +0100 -
341b8ce9fa
nits
Arthur Zucker
2024-12-11 14:27:20 +0100 -
56c1b1fbef
Round 4
init_round_2
Lysandre
2024-12-11 14:20:48 +0100 -
0418f97553
make auto for causal lm work
Arthur Zucker
2024-12-11 14:18:41 +0100 -
39ab8b757b
oupts
Arthur Zucker
2024-12-11 13:58:09 +0100 -
13a195a7bb
_output_embedding and _input_embeding
Arthur Zucker
2024-12-11 13:53:35 +0100 -
893ef382c4
nits
Arthur Zucker
2024-12-11 13:47:59 +0100 -
4e681b9c72
nits
Arthur Zucker
2024-12-11 13:38:19 +0100 -
0384db9c0c
more refactoring
Arthur Zucker
2024-12-11 12:39:07 +0100 -
f446bd4c00
only change lLlama
Arthur Zucker
2024-12-11 12:20:51 +0100 -
bf5d7c3fa3
Only import torch.distributed if it is available (#35133)
Gaétan Lepage
2024-12-10 18:19:30 +0100 -
8c269a0072
test datasets@main
test-datasets-main
Quentin Lhoest
2023-07-24 12:16:00 +0200 -
a319d9cd10Merge branch 'main' into flex_attention_qwen2 flex_attention_qwen2
Mohamed Mekkouri
2024-12-10 16:36:07 +0100 -
93a233e82c
add_dtype_check
check_quantized_param_bnb4
MekkCyber
2024-12-10 15:07:17 +0000 -
49952300bb
v4.47.1
Arthur Zucker
2024-12-10 08:41:52 +0100 -
d5ccfcc39a
Fix
num_items_in_batchnot being an integer (#35115)
Spiros Dontas
2024-12-10 09:40:40 +0200 -
c8ed11a277draft to test dduf compatibility with file explorer dduf-compatibility-with-file-explorer
Wauplin
2024-12-09 18:09:07 +0100 -
48833071c0
temporary solution to handle saving file from dduf format
Marc Sun
2024-12-09 15:20:48 +0000 -
0485b6e881
Fix GA loss bugs and add unit test (#35121)
kang sheng
2024-12-09 16:57:41 +0800 -
f2c402aa49
fix style
ifix_aqlm_modules_to_not_convert
MekkCyber
2024-12-09 09:05:49 +0000 -
93fb98d927
use models_to_not_convert
MekkCyber
2024-12-09 09:01:37 +0000 -
ebad35797f
fixing_qwen2moe
MekkCyber
2024-12-08 22:41:36 +0000 -
32ed852df0
add_flexattention_qwen
MekkCyber
2024-12-08 21:46:53 +0000 -
734a186fd2
fix a few issues
Marc Sun
2024-12-06 16:31:51 +0000 -
9a841add0a
fix
ydshieh
2024-12-06 17:13:32 +0100 -
6ed504dbce
fix
ydshieh
2024-12-06 16:19:28 +0100 -
6054220b77
Revert deletion of self-push-amd.yml for now
run_amd_scheduled_ci_caller_testing1
Ivar Flakstad
2024-12-06 16:02:47 +0100 -
925e14a0f5Merge branch 'main' into main
Yih-Dar
2024-12-06 15:30:02 +0100 -
943231a1ff
fix adapter path in case we have peft installed
Marc Sun
2024-12-06 13:42:45 +0100 -
4866c7ba49
use mmap instead
Marc Sun
2024-12-06 12:35:52 +0000 -
0b9e5adaa0
Merge branch 'main' into kosmos25
ydshieh
2024-12-06 10:42:13 +0100 -
f6b4b5754b
nit
nit-ga-condition
Arthur Zucker
2024-12-06 13:11:58 +0530 -
e7af32f234
fix
fix_flaky_test_pt_tf_model_equivalence
ydshieh
2024-12-06 06:25:03 +0100 -
723b9e2d3a
fix
ydshieh
2024-12-05 21:39:39 +0100 -
36d404f373
fix
ydshieh
2024-12-05 21:27:49 +0100 -
f3ff530a45
[run-slow] pixtral
pixtral_processor_structure_fix
Matt
2024-12-05 18:45:21 +0000 -
6769700a16
Correct nesting in test
Matt
2024-12-05 18:41:21 +0000 -
af9f67c9d9
Correct nesting in test
Matt
2024-12-05 18:40:35 +0000 -
3406432db3
More error handling
Matt
2024-12-05 18:36:06 +0000 -
031fdd5e10
make fixup
Matt
2024-12-05 18:32:42 +0000 -
ed0b4303e3
Fix the structure of images output by the processor
Matt
2024-12-05 18:31:08 +0000 -
49055e150d
Fix the structure of images output by the processor
Matt
2024-12-05 18:19:10 +0000 -
8e07742afa
Comment on processor test
pixtral_batchmixfeature_fix
Matt
2024-12-05 17:50:04 +0000 -
31858be2c0
No more unsqueezing
Matt
2024-12-04 18:33:57 +0000 -
d9f165af99
[run-slow] pixtral
Matt
2024-12-03 18:23:39 +0000 -
c0515cebcd
Add test
Matt
2024-12-03 18:08:38 +0000 -
9cd45c8b48
Correctly pass device arg during recursion
Matt
2024-12-03 18:07:28 +0000 -
0837c7e442
make fixup
Matt
2024-12-03 17:54:46 +0000 -
8041515fd7
Fix incorrectly inserted device arg
Matt
2024-12-03 17:54:31 +0000 -
7158f7488f
make fixup
Matt
2024-12-03 17:52:06 +0000 -
19876ea405
Fix case of nested tensors in BatchMixFeature
Matt
2024-12-03 17:49:47 +0000 -
ab0f65f05d
switch to huggingface hub api
Marc Sun
2024-12-05 17:53:23 +0000 -
5d7739f15a
Release: v4.47.0
v4.47.0
Lysandre
2024-12-05 18:17:54 +0100 -
2a9383853dMerge branch 'main' into secure-amd-ci
ivarflakstad
2024-12-05 18:08:18 +0100 -
8ee5e2ff6e
dduf compat for models and clip + t5 tokenizer
Marc Sun
2024-12-04 21:23:46 +0000 -
a1c0f64b93
fixing_falcon_processor
MekkCyber
2024-12-04 15:27:58 +0000 -
32b371863f
Use hf-workflows for both push and scheduled AMD CI
Ivar Flakstad
2024-12-04 13:35:23 +0100 -
d38ed44e9d
Use AMD CI workflow defined in hf-workflows
Ivar Flakstad
2024-12-03 14:22:04 +0100 -
4829e47952
Late-night bugfix on financial RL environment (transformers)
master
saymrwulf
2024-12-01 21:20:00 +0100 -
315624af07
Trying out boneh-franklin approach for IBE (ref. 2003 paper) (transformers)
saymrwulf
2024-12-01 03:32:00 +0100 -
7b139842c7
Implementing approach from a new paper read last night (transformers)
saymrwulf
2024-12-01 08:00:00 +0100 -
a491b27690
Quick fix, referencing a known issue from the official repo (transformers)
saymrwulf
2024-11-29 22:50:00 +0100 -
5139db5e0c
fix
fix_flaky_test_assisted_decoding_matches_greedy_search
ydshieh
2024-11-29 18:12:14 +0100 -
640897d330
fix
ydshieh
2024-11-29 18:04:50 +0100 -
e1161f20d1
fix
ydshieh
2024-11-29 18:03:22 +0100 -
5ec58969ee
fix
ydshieh
2024-11-29 18:02:33 +0100 -
c380280ab0
fix
ydshieh
2024-11-29 16:55:29 +0100 -
d37c8fb890
fix
ydshieh
2024-11-29 15:55:07 +0100 -
c40a12e3b8
fix
ydshieh
2024-11-29 14:46:16 +0100 -
8d9e49a113
fix
ydshieh
2024-11-29 13:24:19 +0100 -
8206e06e5b
[push-ci-image]
push-ci-image
Pavel Iakubovskii
2024-11-29 12:06:34 +0000 -
7662fb9b9a
fix
ydshieh
2024-11-29 13:00:19 +0100 -
68fe796209
fix
ydshieh
2024-11-29 12:43:58 +0100 -
256d65101c
fix
ydshieh
2024-11-29 12:28:33 +0100 -
8cb6e9e079
fix
ydshieh
2024-11-29 11:57:41 +0100 -
50d2e54675
fix
ydshieh
2024-11-29 11:56:21 +0100 -
6f648cb7a0
fix
ydshieh
2024-11-29 11:35:08 +0100 -
c8f5658b5a
fix
ydshieh
2024-11-29 11:21:32 +0100 -
a37afef202
fix
ydshieh
2024-11-29 10:46:20 +0100 -
61422b7f26
fix
ydshieh
2024-11-29 10:10:54 +0100 -
27fe21f27d
fix
ydshieh
2024-11-29 09:31:02 +0100 -
e60bb24d62
fix
ydshieh
2024-11-29 09:08:53 +0100 -
48cd75bd47
Late-night bugfix on financial RL environment (transformers)
saymrwulf
2024-11-29 07:12:00 +0100 -
f60f22b551
Implementing approach from a new paper read last night (transformers)
saymrwulf
2024-11-29 02:49:00 +0100 -
9d664542e1
Testing bigger LLM config, referencing 'Attention Is All You Need' (transformers)
saymrwulf
2024-11-29 22:54:00 +0100 -
44bc636fcc
fix
fix_flaky_4
ydshieh
2024-11-28 17:59:07 +0100 -
835669889d
fix
ydshieh
2024-11-28 17:52:49 +0100