transformers

saymrwulf/transformers

Fork 0

mirror of https://github.com/saymrwulf/transformers.git synced 2026-05-14 20:58:08 +00:00

Commit graph

Select branches

Hide pull requests

'delete-delete-doc'

29625_add_prefix_space

29625_prefix_space

30824-spmconverter-user-defined-symbol

31187_depreciate_clean_up_tokenization_spaced

BritneyMuller-housekeeping-patch

LysandreJik-patch-1

_dummy_fix_weight_only_usage

_dummy_fix_weight_only_usage_2

add-deci-lm

add-flash-decoding

add-fp8-llama-script

add-git-lfs-to-amd-image

add-qgalore

add-rwkv5

add-warning-4bit-opti

add_amd_daily_ci

add_back_generative_class

add_deformable_detr

add_fa2_bart

add_important_warning_padding_attention_mask

add_kosmos_2_remote

add_kosmos_2_temp

add_kosmos_2_utm5_attn

add_kosmos_2_utm5_attn_rebased

add_kosmos_2_utm5_attn_rebased_flat_layer_structure

add_num_workers_for_tf

add_pipeline_equivalence_testing

add_prefix_space_29625

add_prefix_space_clean

add_siglip_fast_tokenizer_bis

add_tf_export_doc

add_word_level_timestamp_long

adding_fp8_quantization

agent_callback

agents-count-tokens

agents-make-easier-tags

agents-messages

albertvillanova-patch-1

allow_old_falcon_name

amd-nightly-ci

amdgpu-multi-gpu-tests

another_prepare_dataset_fix

api_big2

arijitx/wav2vec2_alignment

assistant_decoding_batch

attn-implementation-vision-enc-dec

auot-convert-tekken

auto-assign-reviewers

auto_gpt4_conversion

autoformer-test-seq-to-seq-add-atol

best_benchmark

best_benchmark_new

best_benchmark_on_static_cache

best_benchmark_on_static_cache_new

bloom_big

bos_eos_token_fix

bos_eos_token_slow

build-check-deepspeed-image

build-docker-torch-2.2

build_ci_docker_image_amd1

build_ci_docker_image_amd2

build_ci_docker_image_amd3

build_docker_on_kube

build_docker_on_kube_2

build_docker_on_kube_3

build_image_abc

byebye

byebye_py_37

cache_exp

change-ci

chat_template_kwargs

check-deepspeed

check-send-headers-when-converting-safetensors

check-whisper-slow-tests

check_amd_image_build

check_compile

check_compile_if_flaky

check_doc_test

check_docker_i

check_ds

check_example_ci

check_example_job

check_fastspeech

check_fix_fix_fix

check_fix_torch_pip

check_flaky

check_flax_example

check_gated_repo

check_gemma

check_gemma_compile

check_gemma_compile_2

check_gen_2

check_layoutlm

check_layoutlmv2

check_limit

check_mem

check_mem_00c1d87

check_mem_3cefac1d

check_mem_56b64bf

check_mem_838b87a

check_nightly_build

check_nightly_build_build_image

check_nougat

check_past_runner

check_permission

check_quant

check_quantized_param_bnb4

check_report

check_safetensors_rc

check_slow_pr

check_speed_no_empty

check_strange_doctest

check_tiny_creation

check_torch_2.2

check_trigger_4d8427f7

check_trigger_a81cf9ee

check_update_cache_number

check_ved_trocr

check_what_wrong_in_tiny_creation

checkout-layoutlm-tokenizers

chunk_length_ctc

ci-amdgpu-build-docker-images

ci-amdgpu-mi250

ci-amdgpu-nightly

ci-test-huggingface-hub-v0.15.0.rc0

ci-test-huggingface-hub-v0.16.0.rc0

ci-test-huggingface-hub-v0.17.0.rc0

ci-test-huggingface-hub-v0.18.0.rc0

ci-test-huggingface-hub-v0.19.0.rc0

ci-test-huggingface-hub-v0.20.0.rc1

ci-test-huggingface-hub-v0.21.0.rc0

ci-test-huggingface-hub-v0.22.0.rc0

ci-test-huggingface-hub-v0.23.0.rc0

ci-test-huggingface-hub-v0.23.0.rc1

ci-test-huggingface-hub-v0.24.0.rc0

ci-test-huggingface-hub-v0.25.0.rc0

ci-test-huggingface-hub-v0.25.0.rc1

ci-test-huggingface-hub-v0.26.0.rc0

ci-test-huggingface-hub-v0.27.0.rc0

ci-test-huggingface-hub-v0.27.0.rc1

ci-test-huggingface-hub-v0.27.0rc1

ci-test-huggingface-hub-v0.28.0.rc0

ci-test-huggingface-hub-v0.28.0.rc5

circleci_combine_reports

circleci_debug_base

circleci_debug_base_MobileNetV1ModelTest_test_batching_equivalence

circleci_debug_base_timm

circleci_debug_base_timm_3

clean_spmcoverter

cohere-diff

cohere-diff-2

compare_ci_with_torch_2.2

compile-rope

continuous-batching

custom_bloom_kernel

databricks

dduf-compability

dduf-compatibility-with-file-explorer

deberta-xla-fixes

debug_bloom

debug_get_jobs

debug_kosmos_2_output

debug_mem_0b192de1

debug_mem_95b37495

debug_metadata_run

debugdebug

debugdebug-2

debugdebug-5

deepseek_v2_support

deepspeed-amd-pytorch-version-fix

default-auto

default-fast-load

delete_big_tokenizer_block

deprecate_LegacyIndex

disable_multi_gpu

doc-builder

doc-link-one-or-two-papers-lysandre

doc-regactor

doc_builder_rename

doc_pr

docker_change_awq_version

docs-ctrl-lys

dont-use-deprecated-method

drop_py38_build_img_2

ds-fix-resume

ds-ignore_mismatched_sizes

dynamic_length_in_static_cache

dynamic_length_in_static_cache_001

dynamic_length_in_static_cache_002

dynamic_length_in_static_cache_reconstruct_tensors_from_length

dynamic_length_on_0ae789e0

dynamic_length_on_75bbfd5b

dynamic_length_on_95b3c381

dynamic_length_on_b6eb708b

enable_tf_numpy

faster_cache_without_compile

faster_copies

faster_set_initialized_submodules

fire

fix-Parameter-init

fix-Seq2SeqTrainingArguments-doc

fix-autoprocessor-import-order

fix-bnb-warning

fix-ci

fix-ci-setup

fix-copies

fix-device-map

fix-doc-builder-edit

fix-flash-comment

fix-from-pretrained

fix-gemma2-sdpa

fix-gemma2-sliding-window

fix-gpt2-scaled-init

fix-int8-serilation

fix-kwargs-issues

fix-llama-3-gguf

fix-pipeline-predict-transform-methods

fix-pixtral-tests

fix-pytorch-deepspeed-image

fix-quality-2

fix-red-ci-atol

fix-slow-tests-shieh-trigger

fix-task-mappings

fix-word-ids

fix-workflow

fix_TFMarianModelTest_test_xla_generate_slow

fix_aria_ci

fix_auto_test

fix_autoawq_docker

fix_autoawq_test

fix_bamba_test

fix_check_copies

fix_chinese_clip

fix_convert_spm_bpe

fix_deprecation_warnings

fix_dinat_2

fix_dinov2

fix_docker_autoawq

fix_docker_autogptq_from_source

fix_doctest

fix_doctest_based_on_refactor_doctest_2

fix_eetq_test

fix_falcon_processor

fix_flaky_4

fix_flaky_test_assisted_decoding_matches_greedy_search

fix_flaky_test_pt_tf_model_equivalence

fix_fp_32

fix_generate_embeds

fix_gptq_test

fix_gptq_tests

fix_jetmoe

fix_more_input_out

fix_not_init

fix_peft_model_in_pipelines

fix_pipe_tests_001

fix_quanto_llama27b

fix_remote_tool

fix_slow_gen_on_0ae789e0

fix_slow_gen_on_75bbfd5b

fix_slow_gen_on_b6eb708b

fix_st5_docs

fix_stupid_cond

fix_test_encode_decode

fix_test_fetcher_tests

fix_tie

fix_whisper_ci

fix_whisper_tflite_export

fix_zh_quicktour_md

flex_attention_qwen2

flex_attn_example

for_test_run_squad_no_trainer

force-convert

full-bf16-train

full_length_on_468f7cca

full_length_on_68b71c85

full_length_on_862cde4c

gemma_allow_compile

general_test_low_cpu_mem

get_bad_commits_for_daily_ci_11_20

get_bad_commits_for_daily_ci_11_26

gpt-flex-attention

gpt-mqa

gptneo_gpt4_port

gptneo_gpt4_port_new

hardware-auto-setup

hardware-auto-setup-ci

hotfix_ci_222

hqq_serialization

idefics3

ifix_aqlm_modules_to_not_convert

improve_error_message_asr_pipeline

improve_error_message_when_transformers_is_misconfigured

improve_torch_version_check

informative-detr-message

init_round_2

init_round_5

int

inverse_chat_templates

jeffboudier-transformers-docs-ad-copy

jnp_devicearray

keras-core-support

keras3_compatibility_phase_2

keras_3_compatibility

larger_runner

less-constraints

link-to-the-hub

llama-break-fix

llama-pad-side

llama-refactor

load_pretrainedfast_auto

make-cache-traceable

mark_whisper_test_slow

master

measure_all_tests

measure_gen

measure_gen_on_0ae789e0

measure_gen_on_75bbfd5b

measure_gen_on_b6eb708b

merge_text2text_into_text_generation

ministral

mitigate_tf_stride_vulnerability

modular-roberta

modular-stablelm

more_reduced_dummy_memory_usage

more_tf_int_dtypes

moshi-integration

move_jobs_from_daily_ci_channel

move_part_2

muellerzr-accum-plugin

muellerzr-ds-investigation

muellerzr-dummy-pr

muellerzr-enable-quant

muellerzr-enable-torchdata

muellerzr-fix-autocast

muellerzr-fix-integration-tests

muellerzr-fix-reentrant

muellerzr-fix-timeout

muellerzr-free-memory

muellerzr-free-memory-passthrough

muellerzr-jobs

muellerzr-less-fixes

muellerzr-lr-sched-right-version

muellerzr-metrics

muellerzr-modeling

muellerzr-more-ga-tests-fast

muellerzr-more-models-sadface

muellerzr-multinode-save

muellerzr-network-retry

muellerzr-skip-dvc

muellerzr-skip-failing-example

muellerzr-speedup-modular-conversion

muellerzr-trainer-refactor

muellerzr-transformers-should-not-set-env-variables

muellerzr-use-scientific

mymain

new-split

nezha_slow

nit-ga-condition

nit-modular-reame

nit-refactor

nit-remove-irrelevant-comment

nit_cleanup

nits-attention

no_more_shape_list

no_overwrite_test_batching_equivalence

noua/bloom_cugraph

np2

on_predict

onnx_gpt2_io_definition

output_ragged

pin-ffspec

pin-gguf

pin_ds

ping_author

ping_author_6

pipeline-revision-mirror

pipelines_signatures

pixtral_batchmixfeature_fix

pixtral_processor_structure_fix

post-action-build-test-tokenizers-main

processor-template-duplicated-tokens

protobuf-4

push-ci-image

quickfix_generate_tests

reenable_test

refactor-attention-converesion

refactor-from-pretrained

refactor_doctest_2

refactoring-new-version

relative-paths

remove-cache-migration-script

remove-items

remove-torch-pre-releases-amd-image

remove-warnings

repro-bug-pytorch-compile

repro-bug-pytorch-compile-cudagraph

reset_logger_level_2

resnet_with_variants

reverse_templating

revert-17547-update-support-image

revert-17646-skip_repo_not_found

revert-31494-add_dac

revert-33934-patch-1

revert-checkpoint-tmp-dir

revert-commit-30302

revert_hard_error2

robust_config_ckpt_check

run-amd

run-fix-Parameter-init

run-move-integrations

run_add_tts_pip

run_amd_push_ci_caller

run_amd_scheduled_ci_caller

run_amd_scheduled_ci_caller_testing

run_amd_scheduled_ci_caller_testing1

run_better_job_artifact_name

run_better_report

run_bon_courage

run_check_auto_mapping_importable

run_check_natten

run_ci_manually

run_daily_ci

run_daily_ci_11_20

run_daily_ci_11_21

run_deepspeed_ci

run_doctest_after_merge

run_doctest_ci

run_ds_ci

run_fc639143

run_fc639143_001

run_fc639143_002

run_fc639143_003

run_feat/kv_cache_class

run_fix_doc_on_circleci

run_fix_error_not_captured

run_nightly_ci_test_new_runner

run_no_job_name

run_past_ci_2nd

run_refactor_doctest

run_run_all_tests

run_run_amd_scheduled_ci_caller_deepspeed_test

run_scheduled_ci_now

run_scheduled_ci_now_2

run_scheduled_ci_now_3

run_scheduled_ci_now_4

run_scheduled_ci_now_5

run_scheduled_ci_now_6

run_sep_model_and_other_no_model_n_8_all_models

run_show_failure_better

run_split_daily_ci_based_on_no_job_name

run_split_daily_ci_based_on_no_job_name_2

run_tiny_with_fix_tiny_model_creation

run_torch_v_2_1

run_trigger_ci_when_tiny_summary_modified

run_truncate

run_update_tiny_002

run_use_main_in_conversion_script

safe_ci_report

safe_serialization_always_valid

safetensors-0.4.2

safetensors-step-2-2

safetensors_pre_release

safetensors_rc

scale

secure-amd-ci

shieh-length_in_compile

show_failure

simplify

simplify-contributions-init

simplify-contributions-inits

simplify-contributions-main-init

simplify-contributions-model_init

skip-tokenizer-test

skip_2_hub_tests

skip_blip2_torchscript

skip_idefics_doctest

sliding-window

smangrul/fix-auto-batch-finder-trainer-issue

smangrul/integrate-accelerate

smangrul/starcoder-int4-ddp-flash-attn

split_daily_ci

spmconverter_user_symbols

ssh_new_cluster

starcoder-2-fix

stas00-patch-1

state_spaces_call_for_contribution

stop-ci-on-fail-doc

stop-throwing-cache-warning

support-copy

sync-table-question-answering

sync_dqa_pipeline

sync_token_classification_and_zero_shot

sync_vqa_pipeline

t5-fp16-no-nans

temp-disable-scheduled-amd-ci

temp-kosmos25

temporary_pin_torch_2

tensor-cache

test-bin-format

test-build-ci-uv

test-datasets-2.14

test-datasets-2.21

test-datasets-3.0

test-datasets-main

test-datasets-pr

test-deepseek-fp8

test-doctests

test-eetq-dockerfile

test-fa2

test-huggingface_hub-pre-release

test-new-doc-builder-workflow

test-seentok

test-tokenizer-release

test-tokenizers-main

test_bc_tokenizers

test_ci

test_composition_2

test_composition_lysandre

test_composition_remote_tool

test_doc

test_docker_run_quantization

test_if_token

test_release_candidates

test_run_scheduler_ci

test_safetensors

test_safetensors_0.5.0

test_safetensors_abi3

test_tokenizers_0.19.0rc0

test_tokenizers_abi3

tf_forced_logits_xla_compatible

tf_int64_tests

tf_llama_port

tf_new_dummy_building

tf_quicktour_fix

tfconvnext

thomas/accelerate_gpt2

thomas/accelerate_gptj

thomas/add_custom_kernels

thomas/bloom_allow_fp32_lm_head

thomas/dirty_bloom_tp

thomas/fix_bloom

thomas/improve_bloom_generation_speed

thomas/llama

thomas/make_tp_bloom_generate_work

thomas/make_tp_work_with_bloom

tied_weights_load

tied_weights_warning_check

timm_wrapper_kwargs

tok-update

tokenizer-release

tokenizers_rc1

tools-inference-endpoints

torch-2.2-on-daily-ci

torch_versions

tp-loading

tp-support

trad_fixes

trainer-hyperparameter-search-kwargs-docs-update

trigger-amd-image-build

trigger_ci_with_torch_2_4

trigger_daily_ci

trigger_debug

trigger_disable_multi_gpu

trigger_doc

trigger_pt_10_past_ci

trigger_run_amd_scheduled_ci_caller_deepspeed_test

trigger_slow

trigger_test_cached_model_has_minimum_calls_to_head

trigger_upload_artifacts_3

try_comment_bot

try_fix_whisper_slow_test

try_matrix_fail

try_new_natten

try_new_natten_2

try_pydantic_v2_build_images

try_run_amd_push_ci_caller

try_sub

update-add-new-model

update-cooki

update-doc-gpu

update-from-pretrained

update-quantization-docker

update-special-tokens

update-tokenizers-version

update_27265

update_kosmos_2_file

update_llama_template

update_ssh

upgrade_tokenizers2

use-hfh-loading-saving-state-dict-helpers

use-process-retry-on-amd-smi

use-safetensors-from-pr

use-uv-

use_pt_25_image

v3.5.1hotfix

v4.0.0-release

v4.0.1-release

v4.10.0

v4.10.0-release

v4.10.1-release

v4.10.2-release

v4.10.3-release

v4.12.1-release

v4.12.2-release

v4.12.3-release

v4.12.4-release

v4.12.5-release

v4.14.1-release

v4.16.1-release

v4.16.2-release

v4.17.0-release

v4.18-release

v4.19-release

v4.2.1-patch

v4.2.2-patch

v4.20-release

v4.21-release

v4.22-release

v4.23-release

v4.24-release

v4.25-release

v4.26-release

v4.27-release

v4.28-release

v4.29-release

v4.3.0-release

v4.3.1-release

v4.3.2-release

v4.3.3-release

v4.30-release

v4.31-release

v4.32-release

v4.33-release

v4.34-release

v4.35-release

v4.36-release

v4.37-release

v4.38-release

v4.39-release

v4.4.2-release

v4.40-release

v4.41-release

v4.42-release

v4.43-release

v4.44-release

v4.45-release

v4.46-release

v4.47-release

v4.48-release

v4.5.0-release

v4.5.1-release

v4.6.0-release

v4.8.0-release

v4.8.2-release

v4.9.1

v4.9.2-release

warn-pre-allocation

whisper_chunking

whisper_out_of_range

wip_test_safetensors_rc

xenova-patch-1

xla_concrete_fn_dynamic_shape_debug

ydshieh-push-ci-image

ydshieh_check_run_nightly_ci_test_new_runner

yih-dar-try-compile_models

younes-opt-350-m

younes-test-workflow

younesbelkada-patch-1

zach-accelerate-integration

0.1.2

0.5.0

1.0

1.1.0

1.2.0

3.0.1

4.3.0.rc1

list

localattn1

v0.1.2

v0.2.0

v0.3.0

v0.4.0

v0.5.0

v0.5.1

v0.6.0

v0.6.1

v0.6.2

v1.0.0

v2.0.0

v2.1.0

v2.1.1

v2.10.0

v2.11.0

v2.2.0

v2.2.1

v2.2.2

v2.3.0

v2.4.0

v2.4.1

v2.5.0

v2.5.1

v2.6.0

v2.7.0

v2.8.0

v2.9.0

v2.9.1

v3.0.0

v3.0.1

v3.0.2

v3.1.0

v3.2.0

v3.3.0

v3.3.1

v3.4.0

v3.5.0

v3.5.1

v4.0.0

v4.0.0-rc-1

v4.0.1

v4.1.0

v4.1.1

v4.10.0

v4.10.1

v4.10.2

v4.10.3

v4.11.0

v4.11.1

v4.11.2

v4.11.3

v4.12.0

v4.12.1

v4.12.2

v4.12.3

v4.12.4

v4.12.5

v4.13.0

v4.14.0

v4.14.1

v4.15.0

v4.16.0

v4.16.1

v4.16.2

v4.17.0

v4.18.0

v4.19.0

v4.19.1

v4.19.2

v4.19.3

v4.19.4

v4.2.0

v4.2.1

v4.2.2

v4.20.0

v4.20.1

v4.21.0

v4.21.1

v4.21.2

v4.21.3

v4.22.0

v4.22.1

v4.22.2

v4.23.0

v4.23.1

v4.24.0

v4.25.1

v4.26.0

v4.26.1

v4.27.0

v4.27.1

v4.27.2

v4.27.3

v4.27.4

v4.28.0

v4.28.1

v4.29.0

v4.29.1

v4.29.2

v4.3.0

v4.3.0.rc1

v4.3.1

v4.3.2

v4.3.3

v4.30.0

v4.30.1

v4.30.2

v4.31.0

v4.32.0

v4.32.1

v4.33.0

v4.33.1

v4.33.2

v4.33.3

v4.34.0

v4.34.1

v4.35.0

v4.35.1

v4.35.2

v4.36.0

v4.36.1

v4.36.2

v4.37.0

v4.37.1

v4.37.2

v4.38.0

v4.38.1

v4.38.2

v4.39.0

v4.39.1

v4.39.2

v4.39.3

v4.4.0

v4.4.1

v4.4.2

v4.40.0

v4.40.1

v4.40.2

v4.41.0

v4.41.1

v4.41.2

v4.42.0

v4.42.1

v4.42.2

v4.42.3

v4.42.4

v4.43.0

v4.43.1

v4.43.2

v4.43.3

v4.43.4

v4.44.0

v4.44.1

v4.44.2

v4.45.0

v4.45.1

v4.45.2

v4.46.0

v4.46.1

v4.46.2

v4.46.3

v4.47.0

v4.47.1

v4.48.0

v4.48.1

v4.48.2

v4.48.3

v4.5.0

v4.5.1

v4.6.0

v4.6.1

v4.7.0

v4.8.0

v4.8.1

v4.8.2

v4.9.0

v4.9.1

v4.9.2

7a911efddf update Arthur Zucker 2024-12-11 17:39:40 +0100
10e2fb75c1 Add retry torch decorator [[ -z $EMAIL ]] && read -e -p "Enter your email (for git configuration): " EMAIL 2024-12-11 11:34:13 -0500
89d32d6825 fix auto set Arthur Zucker 2024-12-11 17:30:26 +0100
3bbae39539 remove tanh Arthur Zucker 2024-12-11 17:24:56 +0100
e5d60b4f23 fix Arthur Zucker 2024-12-11 17:07:20 +0100
4b9a429a1c style Arthur Zucker 2024-12-11 16:54:35 +0100
1ef18f49a9 style Arthur Zucker 2024-12-11 16:53:02 +0100
28829d2dd6 there was an issue with tie weight keys Arthur Zucker 2024-12-11 16:44:04 +0100
40154815cb revert some stuff Arthur Zucker 2024-12-11 16:23:18 +0100
38dd294dd7 fix Arthur Zucker 2024-12-11 16:10:40 +0100
1baabd3207 update Arthur Zucker 2024-12-11 15:13:39 +0100
dcf7a37ce1 cache concatenates on the wrong axis Arthur Zucker 2024-12-11 14:38:26 +0100
f61a5fec41 pass attention Arthur Zucker 2024-12-11 14:37:12 +0100
556aa4ec2d updates Arthur Zucker 2024-12-11 14:35:53 +0100
341b8ce9fa nits Arthur Zucker 2024-12-11 14:27:20 +0100
56c1b1fbef Round 4 init_round_2 Lysandre 2024-12-11 14:20:48 +0100
0418f97553 make auto for causal lm work Arthur Zucker 2024-12-11 14:18:41 +0100
39ab8b757b oupts Arthur Zucker 2024-12-11 13:58:09 +0100
13a195a7bb _output_embedding and _input_embeding Arthur Zucker 2024-12-11 13:53:35 +0100
893ef382c4 nits Arthur Zucker 2024-12-11 13:47:59 +0100
4e681b9c72 nits Arthur Zucker 2024-12-11 13:38:19 +0100
0384db9c0c more refactoring Arthur Zucker 2024-12-11 12:39:07 +0100
f446bd4c00 only change lLlama Arthur Zucker 2024-12-11 12:20:51 +0100
bf5d7c3fa3 Only import torch.distributed if it is available (#35133) Gaétan Lepage 2024-12-10 18:19:30 +0100
8c269a0072 test datasets@main test-datasets-main Quentin Lhoest 2023-07-24 12:16:00 +0200
a319d9cd10

Merge branch 'main' into flex_attention_qwen2 flex_attention_qwen2 Mohamed Mekkouri 2024-12-10 16:36:07 +0100
93a233e82c add_dtype_check check_quantized_param_bnb4 MekkCyber 2024-12-10 15:07:17 +0000
49952300bb v4.47.1 Arthur Zucker 2024-12-10 08:41:52 +0100
d5ccfcc39a Fix num_items_in_batch not being an integer (#35115) Spiros Dontas 2024-12-10 09:40:40 +0200
c8ed11a277

draft to test dduf compatibility with file explorer dduf-compatibility-with-file-explorer Wauplin 2024-12-09 18:09:07 +0100
48833071c0 temporary solution to handle saving file from dduf format Marc Sun 2024-12-09 15:20:48 +0000
0485b6e881 Fix GA loss bugs and add unit test (#35121) kang sheng 2024-12-09 16:57:41 +0800
f2c402aa49 fix style ifix_aqlm_modules_to_not_convert MekkCyber 2024-12-09 09:05:49 +0000
93fb98d927 use models_to_not_convert MekkCyber 2024-12-09 09:01:37 +0000
ebad35797f fixing_qwen2moe MekkCyber 2024-12-08 22:41:36 +0000
32ed852df0 add_flexattention_qwen MekkCyber 2024-12-08 21:46:53 +0000
734a186fd2 fix a few issues Marc Sun 2024-12-06 16:31:51 +0000
9a841add0a fix ydshieh 2024-12-06 17:13:32 +0100
6ed504dbce fix ydshieh 2024-12-06 16:19:28 +0100
6054220b77 Revert deletion of self-push-amd.yml for now run_amd_scheduled_ci_caller_testing1 Ivar Flakstad 2024-12-06 16:02:47 +0100
925e14a0f5

Merge branch 'main' into main Yih-Dar 2024-12-06 15:30:02 +0100
943231a1ff fix adapter path in case we have peft installed Marc Sun 2024-12-06 13:42:45 +0100
4866c7ba49 use mmap instead Marc Sun 2024-12-06 12:35:52 +0000
0b9e5adaa0 Merge branch 'main' into kosmos25 ydshieh 2024-12-06 10:42:13 +0100
f6b4b5754b nit nit-ga-condition Arthur Zucker 2024-12-06 13:11:58 +0530
e7af32f234 fix fix_flaky_test_pt_tf_model_equivalence ydshieh 2024-12-06 06:25:03 +0100
723b9e2d3a fix ydshieh 2024-12-05 21:39:39 +0100
36d404f373 fix ydshieh 2024-12-05 21:27:49 +0100
f3ff530a45 [run-slow] pixtral pixtral_processor_structure_fix Matt 2024-12-05 18:45:21 +0000
6769700a16 Correct nesting in test Matt 2024-12-05 18:41:21 +0000
af9f67c9d9 Correct nesting in test Matt 2024-12-05 18:40:35 +0000
3406432db3 More error handling Matt 2024-12-05 18:36:06 +0000
031fdd5e10 make fixup Matt 2024-12-05 18:32:42 +0000
ed0b4303e3 Fix the structure of images output by the processor Matt 2024-12-05 18:31:08 +0000
49055e150d Fix the structure of images output by the processor Matt 2024-12-05 18:19:10 +0000
8e07742afa Comment on processor test pixtral_batchmixfeature_fix Matt 2024-12-05 17:50:04 +0000
31858be2c0 No more unsqueezing Matt 2024-12-04 18:33:57 +0000
d9f165af99 [run-slow] pixtral Matt 2024-12-03 18:23:39 +0000
c0515cebcd Add test Matt 2024-12-03 18:08:38 +0000
9cd45c8b48 Correctly pass device arg during recursion Matt 2024-12-03 18:07:28 +0000
0837c7e442 make fixup Matt 2024-12-03 17:54:46 +0000
8041515fd7 Fix incorrectly inserted device arg Matt 2024-12-03 17:54:31 +0000
7158f7488f make fixup Matt 2024-12-03 17:52:06 +0000
19876ea405 Fix case of nested tensors in BatchMixFeature Matt 2024-12-03 17:49:47 +0000
ab0f65f05d switch to huggingface hub api Marc Sun 2024-12-05 17:53:23 +0000
5d7739f15a Release: v4.47.0 v4.47.0 Lysandre 2024-12-05 18:17:54 +0100
2a9383853d

Merge branch 'main' into secure-amd-ci ivarflakstad 2024-12-05 18:08:18 +0100
8ee5e2ff6e dduf compat for models and clip + t5 tokenizer Marc Sun 2024-12-04 21:23:46 +0000
a1c0f64b93 fixing_falcon_processor MekkCyber 2024-12-04 15:27:58 +0000
32b371863f Use hf-workflows for both push and scheduled AMD CI Ivar Flakstad 2024-12-04 13:35:23 +0100
d38ed44e9d Use AMD CI workflow defined in hf-workflows Ivar Flakstad 2024-12-03 14:22:04 +0100
4829e47952 Late-night bugfix on financial RL environment (transformers) master saymrwulf 2024-12-01 21:20:00 +0100
315624af07 Trying out boneh-franklin approach for IBE (ref. 2003 paper) (transformers) saymrwulf 2024-12-01 03:32:00 +0100
7b139842c7 Implementing approach from a new paper read last night (transformers) saymrwulf 2024-12-01 08:00:00 +0100
a491b27690 Quick fix, referencing a known issue from the official repo (transformers) saymrwulf 2024-11-29 22:50:00 +0100
5139db5e0c fix fix_flaky_test_assisted_decoding_matches_greedy_search ydshieh 2024-11-29 18:12:14 +0100
640897d330 fix ydshieh 2024-11-29 18:04:50 +0100
e1161f20d1 fix ydshieh 2024-11-29 18:03:22 +0100
5ec58969ee fix ydshieh 2024-11-29 18:02:33 +0100
c380280ab0 fix ydshieh 2024-11-29 16:55:29 +0100
d37c8fb890 fix ydshieh 2024-11-29 15:55:07 +0100
c40a12e3b8 fix ydshieh 2024-11-29 14:46:16 +0100
8d9e49a113 fix ydshieh 2024-11-29 13:24:19 +0100
8206e06e5b [push-ci-image] push-ci-image Pavel Iakubovskii 2024-11-29 12:06:34 +0000
7662fb9b9a fix ydshieh 2024-11-29 13:00:19 +0100
68fe796209 fix ydshieh 2024-11-29 12:43:58 +0100
256d65101c fix ydshieh 2024-11-29 12:28:33 +0100
8cb6e9e079 fix ydshieh 2024-11-29 11:57:41 +0100
50d2e54675 fix ydshieh 2024-11-29 11:56:21 +0100
6f648cb7a0 fix ydshieh 2024-11-29 11:35:08 +0100
c8f5658b5a fix ydshieh 2024-11-29 11:21:32 +0100
a37afef202 fix ydshieh 2024-11-29 10:46:20 +0100
61422b7f26 fix ydshieh 2024-11-29 10:10:54 +0100
27fe21f27d fix ydshieh 2024-11-29 09:31:02 +0100
e60bb24d62 fix ydshieh 2024-11-29 09:08:53 +0100
48cd75bd47 Late-night bugfix on financial RL environment (transformers) saymrwulf 2024-11-29 07:12:00 +0100
f60f22b551 Implementing approach from a new paper read last night (transformers) saymrwulf 2024-11-29 02:49:00 +0100
9d664542e1 Testing bigger LLM config, referencing 'Attention Is All You Need' (transformers) saymrwulf 2024-11-29 22:54:00 +0100
44bc636fcc fix fix_flaky_4 ydshieh 2024-11-28 17:59:07 +0100
835669889d fix ydshieh 2024-11-28 17:52:49 +0100