diff --git a/setup.py b/setup.py
index c04e6f732d5..3945537c49f 100644
--- a/setup.py
+++ b/setup.py
@@ -114,12 +114,12 @@ _deps = [
     "GitPython<3.1.19",
     "hf-doc-builder>=0.3.0",
     "hf_xet",
-    "huggingface-hub>=0.34.0,<1.0",
+    "huggingface-hub==1.0.0.rc1",
     "importlib_metadata",
     "ipadic>=1.0.0,<2.0",
     "jinja2>=3.1.0",
     "kenlm",
-    "kernels>=0.6.1,<=0.9",
+    "kernels>=0.10.2,<0.11",
     "librosa",
     "natten>=0.14.6,<0.15.0",
     "nltk<=3.8.1",
diff --git a/src/transformers/audio_utils.py b/src/transformers/audio_utils.py
index e2137bb1d1b..189c947fd19 100644
--- a/src/transformers/audio_utils.py
+++ b/src/transformers/audio_utils.py
@@ -25,11 +25,8 @@
 from collections.abc import Sequence
 from io import BytesIO
 from typing import TYPE_CHECKING, Any, Optional, Union
-
-if TYPE_CHECKING:
-    import torch
+import httpx
 import numpy as np
-import requests
 from packaging import version

 from .utils import (
@@ -42,6 +39,9 @@ from .utils import (
 )

+if TYPE_CHECKING:
+    import torch
+
 if is_soundfile_available():
     import soundfile as sf
@@ -132,7 +132,9 @@ def load_audio_librosa(audio: Union[str, np.ndarray], sampling_rate=16000, timeo
     # Load audio from URL (e.g https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen2-Audio/audio/translate_to_chinese.wav)
     if audio.startswith("http://") or audio.startswith("https://"):
-        audio = librosa.load(BytesIO(requests.get(audio, timeout=timeout).content), sr=sampling_rate)[0]
+        audio = librosa.load(
+            BytesIO(httpx.get(audio, follow_redirects=True, timeout=timeout).content), sr=sampling_rate
+        )[0]
     elif os.path.isfile(audio):
         audio = librosa.load(audio, sr=sampling_rate)[0]
     return audio
@@ -174,7 +176,7 @@ def load_audio_as(
     # Load audio bytes from URL or file
     audio_bytes = None
     if audio.startswith(("http://", "https://")):
-        response = requests.get(audio, timeout=timeout)
+        response = httpx.get(audio, follow_redirects=True, timeout=timeout)
         response.raise_for_status()
         audio_bytes = response.content
     elif os.path.isfile(audio):
diff --git a/src/transformers/dependency_versions_table.py b/src/transformers/dependency_versions_table.py
index bd1a34ee747..80b107d93c4 100644
--- a/src/transformers/dependency_versions_table.py
+++ b/src/transformers/dependency_versions_table.py
@@ -23,12 +23,12 @@ deps = {
     "GitPython": "GitPython<3.1.19",
     "hf-doc-builder": "hf-doc-builder>=0.3.0",
     "hf_xet": "hf_xet",
-    "huggingface-hub": "huggingface-hub>=0.34.0,<1.0",
+    "huggingface-hub": "huggingface-hub==1.0.0.rc1",
     "importlib_metadata": "importlib_metadata",
     "ipadic": "ipadic>=1.0.0,<2.0",
     "jinja2": "jinja2>=3.1.0",
     "kenlm": "kenlm",
-    "kernels": "kernels>=0.6.1,<=0.9",
+    "kernels": "kernels>=0.10.2,<0.11",
     "librosa": "librosa",
     "natten": "natten>=0.14.6,<0.15.0",
     "nltk": "nltk<=3.8.1",
diff --git a/src/transformers/file_utils.py b/src/transformers/file_utils.py
index 91d7974b55c..d1f456f9a71 100644
--- a/src/transformers/file_utils.py
+++ b/src/transformers/file_utils.py
@@ -17,9 +17,6 @@ File utilities: utilities related to download and cache models
 This module should not be update anymore and is only left for backward compatibility.
 """

-from huggingface_hub import get_full_repo_name  # for backward compatibility
-from huggingface_hub.constants import HF_HUB_DISABLE_TELEMETRY as DISABLE_TELEMETRY  # for backward compatibility
-
 from . import __version__

 # Backward compatibility imports, to make sure all those objects can be found in file_utils
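Note: the recurring `follow_redirects=True` above is the crux of the requests → httpx migration. requests follows redirects by default; httpx does not, and Hub `resolve/` URLs typically answer with a redirect to a CDN host. A minimal sketch of the difference (the URL is illustrative):

import httpx

url = "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/bee.jpg"

bare = httpx.get(url)  # may return the 3xx redirect response itself
followed = httpx.get(url, follow_redirects=True)  # fetches the final content
print(bare.status_code, followed.status_code)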
diff --git a/src/transformers/image_utils.py b/src/transformers/image_utils.py
index ac3258da67b..d018174dd83 100644
--- a/src/transformers/image_utils.py
+++ b/src/transformers/image_utils.py
@@ -19,8 +19,8 @@ from dataclasses import dataclass
 from io import BytesIO
 from typing import Optional, Union

+import httpx
 import numpy as np
-import requests

 from .utils import (
     ExplicitEnum,
@@ -462,7 +462,7 @@ def load_image(image: Union[str, "PIL.Image.Image"], timeout: Optional[float] =
     if image.startswith("http://") or image.startswith("https://"):
         # We need to actually check for a real protocol, otherwise it's impossible to use a local file
         # like http_huggingface_co.png
-        image = PIL.Image.open(BytesIO(requests.get(image, timeout=timeout).content))
+        image = PIL.Image.open(BytesIO(httpx.get(image, timeout=timeout, follow_redirects=True).content))
     elif os.path.isfile(image):
         image = PIL.Image.open(image)
     else:
diff --git a/src/transformers/modelcard.py b/src/transformers/modelcard.py
index 8ba390ee7cf..9a9d8145d2a 100644
--- a/src/transformers/modelcard.py
+++ b/src/transformers/modelcard.py
@@ -21,7 +21,7 @@ from dataclasses import dataclass
 from pathlib import Path
 from typing import Any, Optional, Union

-import requests
+import httpx
 import yaml
 from huggingface_hub import model_info
 from huggingface_hub.errors import OfflineModeIsEnabled
@@ -380,12 +380,7 @@ class TrainingSummary:
             for tag in info.tags:
                 if tag.startswith("license:"):
                     self.license = tag[8:]
-        except (
-            requests.exceptions.HTTPError,
-            requests.exceptions.ConnectionError,
-            HFValidationError,
-            OfflineModeIsEnabled,
-        ):
+        except (httpx.HTTPError, HFValidationError, OfflineModeIsEnabled):
             pass

     def create_model_index(self, metric_mapping):
diff --git a/src/transformers/pipelines/audio_classification.py b/src/transformers/pipelines/audio_classification.py
index 58fb3ab4fca..86f0a95a51f 100644
--- a/src/transformers/pipelines/audio_classification.py
+++ b/src/transformers/pipelines/audio_classification.py
@@ -14,8 +14,8 @@
 import subprocess
 from typing import Any, Union

+import httpx
 import numpy as np
-import requests

 from ..utils import add_end_docstrings, is_torch_available, is_torchaudio_available, is_torchcodec_available, logging
 from .base import Pipeline, build_pipeline_init_args
@@ -168,7 +168,7 @@ class AudioClassificationPipeline(Pipeline):
             if inputs.startswith("http://") or inputs.startswith("https://"):
                 # We need to actually check for a real protocol, otherwise it's impossible to use a local file
                 # like http_huggingface_co.png
-                inputs = requests.get(inputs).content
+                inputs = httpx.get(inputs, follow_redirects=True).content
             else:
                 with open(inputs, "rb") as f:
                     inputs = f.read()
diff --git a/src/transformers/pipelines/automatic_speech_recognition.py b/src/transformers/pipelines/automatic_speech_recognition.py
index 960bc00f4c5..1f3c2152616 100644
--- a/src/transformers/pipelines/automatic_speech_recognition.py
+++ b/src/transformers/pipelines/automatic_speech_recognition.py
@@ -14,8 +14,8 @@
 from collections import defaultdict
 from typing import TYPE_CHECKING, Any, Optional, Union

+import httpx
 import numpy as np
-import requests

 from ..generation import GenerationConfig
 from ..tokenization_utils import PreTrainedTokenizer
@@ -355,7 +355,7 @@ class AutomaticSpeechRecognitionPipeline(ChunkPipeline):
             if inputs.startswith("http://") or inputs.startswith("https://"):
                 # We need to actually check for a real protocol, otherwise it's impossible to use a local file
                 # like http_huggingface_co.png
-                inputs = requests.get(inputs).content
+                inputs = httpx.get(inputs, follow_redirects=True).content
             else:
                 with open(inputs, "rb") as f:
                     inputs = f.read()
diff --git a/src/transformers/pipelines/image_to_image.py b/src/transformers/pipelines/image_to_image.py
index 094a511449d..957284d2ab1 100644
--- a/src/transformers/pipelines/image_to_image.py
+++ b/src/transformers/pipelines/image_to_image.py
@@ -46,12 +46,13 @@ class ImageToImagePipeline(Pipeline):
     ```python
     >>> from PIL import Image
-    >>> import requests
+    >>> import httpx
+    >>> import io

     >>> from transformers import pipeline

     >>> upscaler = pipeline("image-to-image", model="caidas/swin2SR-classical-sr-x2-64")
-    >>> img = Image.open(requests.get("http://images.cocodataset.org/val2017/000000039769.jpg", stream=True).raw)
+    >>> img = Image.open(io.BytesIO(httpx.get("http://images.cocodataset.org/val2017/000000039769.jpg").content))
     >>> img = img.resize((64, 64))
     >>> upscaled_img = upscaler(img)
     >>> img.size
diff --git a/src/transformers/pipelines/video_classification.py b/src/transformers/pipelines/video_classification.py
index ab57d46e7cc..e073d921e9e 100644
--- a/src/transformers/pipelines/video_classification.py
+++ b/src/transformers/pipelines/video_classification.py
@@ -15,7 +15,7 @@ import warnings
 from io import BytesIO
 from typing import Any, Optional, Union, overload

-import requests
+import httpx

 from ..utils import (
     add_end_docstrings,
@@ -142,7 +142,7 @@ class VideoClassificationPipeline(Pipeline):
             num_frames = self.model.config.num_frames

         if video.startswith("http://") or video.startswith("https://"):
-            video = BytesIO(requests.get(video).content)
+            video = BytesIO(httpx.get(video, follow_redirects=True).content)

         container = av.open(video)
diff --git a/src/transformers/pipelines/zero_shot_audio_classification.py b/src/transformers/pipelines/zero_shot_audio_classification.py
index fa9a2fe6ecf..7d5e36e5dd0 100644
--- a/src/transformers/pipelines/zero_shot_audio_classification.py
+++ b/src/transformers/pipelines/zero_shot_audio_classification.py
@@ -15,8 +15,8 @@
 from collections import UserDict
 from typing import Any, Union

+import httpx
 import numpy as np
-import requests

 from ..utils import (
     add_end_docstrings,
@@ -107,7 +107,7 @@ class ZeroShotAudioClassificationPipeline(Pipeline):
         if audio.startswith("http://") or audio.startswith("https://"):
             # We need to actually check for a real protocol, otherwise it's impossible to use a local file
             # like http_huggingface_co.png
-            audio = requests.get(audio).content
+            audio = httpx.get(audio, follow_redirects=True).content
         else:
             with open(audio, "rb") as f:
                 audio = f.read()
diff --git a/src/transformers/safetensors_conversion.py b/src/transformers/safetensors_conversion.py
index f1612d3ea57..397240cadc9 100644
--- a/src/transformers/safetensors_conversion.py
+++ b/src/transformers/safetensors_conversion.py
@@ -1,6 +1,6 @@
 from typing import Optional

-import requests
+import httpx
 from huggingface_hub import Discussion, HfApi, get_repo_discussions

 from .utils import cached_file, http_user_agent, logging
@@ -44,10 +44,10 @@ def spawn_conversion(token: str, private: bool, model_id: str):

     data = {"data": [model_id, private, token]}

-    result = requests.post(sse_url, stream=True, json=data).json()
+    result = httpx.post(sse_url, follow_redirects=True, json=data).json()
     event_id = result["event_id"]

-    with requests.get(f"{sse_url}/{event_id}", stream=True) as sse_connection:
+    with httpx.stream("GET", f"{sse_url}/{event_id}") as sse_connection:
         try:
             logger.debug("Spawning safetensors automatic conversion.")
             start(sse_connection)
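Note: `requests.get(..., stream=True).raw` has no one-line httpx equivalent, so this diff ports it in two ways. A sketch of both, assuming in the first case that the payload fits in memory (URL illustrative):

import io

import httpx
from PIL import Image

url = "http://images.cocodataset.org/val2017/000000039769.jpg"

# Small payloads: buffer the whole body, as the docstring above now does.
img = Image.open(io.BytesIO(httpx.get(url, follow_redirects=True).content))

# Large or incremental payloads (e.g. the SSE connection above): httpx's
# context-managed streaming API replaces requests' `stream=True` flag.
with httpx.stream("GET", url, follow_redirects=True) as response:
    for chunk in response.iter_bytes():
        pass  # consume incrementally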
f"{sse_url}/{event_id}") as sse_connection: try: logger.debug("Spawning safetensors automatic conversion.") start(sse_connection) diff --git a/src/transformers/testing_utils.py b/src/transformers/testing_utils.py index a7bbc8cd82f..304683b5f10 100644 --- a/src/transformers/testing_utils.py +++ b/src/transformers/testing_utils.py @@ -45,10 +45,9 @@ from typing import Any, Callable, Optional, Union from unittest import mock from unittest.mock import patch -import huggingface_hub.utils -import requests +import httpx import urllib3 -from huggingface_hub import delete_repo +from huggingface_hub import create_repo, delete_repo from packaging import version from transformers import Trainer @@ -1848,7 +1847,7 @@ class TemporaryHubRepo: repo_id = Path(tmp_dir).name if namespace is not None: repo_id = f"{namespace}/{repo_id}" - self.repo_url = huggingface_hub.create_repo(repo_id, token=self.token) + self.repo_url = create_repo(repo_id, token=self.token) def __enter__(self): return self.repo_url @@ -2660,13 +2659,14 @@ def hub_retry(max_attempts: int = 5, wait_before_retry: Optional[float] = 2): while retry_count < max_attempts: try: return test_func_ref(*args, **kwargs) - # We catch all exceptions related to network issues from requests + # We catch all exceptions related to network issues from httpx except ( - requests.exceptions.ConnectionError, - requests.exceptions.Timeout, - requests.exceptions.ReadTimeout, - requests.exceptions.HTTPError, - requests.exceptions.RequestException, + httpx.HTTPError, + httpx.RequestError, + httpx.TimeoutException, + httpx.ReadTimeout, + httpx.ConnectError, + httpx.NetworkError, ) as err: logger.error( f"Test failed with {err} at try {retry_count}/{max_attempts} as it couldn't connect to the specified Hub repository." diff --git a/src/transformers/trainer.py b/src/transformers/trainer.py index 0cd8fcf8cd1..76d36327b30 100755 --- a/src/transformers/trainer.py +++ b/src/transformers/trainer.py @@ -49,7 +49,7 @@ import huggingface_hub.utils as hf_hub_utils import numpy as np import torch import torch.distributed as dist -from huggingface_hub import ModelCard, create_repo, upload_folder +from huggingface_hub import CommitInfo, ModelCard, create_repo, upload_folder from packaging import version from torch import nn from torch.utils.data import DataLoader, Dataset, IterableDataset, RandomSampler, SequentialSampler @@ -5117,7 +5117,7 @@ class Trainer: token: Optional[str] = None, revision: Optional[str] = None, **kwargs, - ) -> str: + ) -> CommitInfo: """ Upload `self.model` and `self.processing_class` to the 🤗 model hub on the repo `self.args.hub_model_id`. diff --git a/src/transformers/utils/__init__.py b/src/transformers/utils/__init__.py index 70eed29f3a6..e6fb2104d06 100644 --- a/src/transformers/utils/__init__.py +++ b/src/transformers/utils/__init__.py @@ -16,8 +16,6 @@ from functools import lru_cache -from huggingface_hub import get_full_repo_name # for backward compatibility -from huggingface_hub.constants import HF_HUB_DISABLE_TELEMETRY as DISABLE_TELEMETRY # for backward compatibility from packaging import version from .. import __version__ diff --git a/src/transformers/utils/attention_visualizer.py b/src/transformers/utils/attention_visualizer.py index 2d0783ae2d4..4ddcbd021a6 100644 --- a/src/transformers/utils/attention_visualizer.py +++ b/src/transformers/utils/attention_visualizer.py @@ -11,9 +11,9 @@ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
diff --git a/src/transformers/utils/hub.py b/src/transformers/utils/hub.py
index d056fc0e877..3a30878d1e0 100644
--- a/src/transformers/utils/hub.py
+++ b/src/transformers/utils/hub.py
@@ -27,8 +27,8 @@ from typing import Optional, Union
 from urllib.parse import urlparse
 from uuid import uuid4

+import httpx
 import huggingface_hub
-import requests
 from huggingface_hub import (
     _CACHED_NO_EXIST,
     CommitOperationAdd,
@@ -58,7 +58,6 @@ from huggingface_hub.utils import (
     hf_raise_for_status,
     send_telemetry,
 )
-from requests.exceptions import HTTPError

 from . import __version__, logging
 from .generic import working_or_temp_dir
@@ -176,7 +175,7 @@ def list_repo_templates(
         ]
     except (GatedRepoError, RepositoryNotFoundError, RevisionNotFoundError):
         raise  # valid errors => do not catch
-    except (HTTPError, OfflineModeIsEnabled, requests.exceptions.ConnectionError):
+    except (HfHubHTTPError, OfflineModeIsEnabled, httpx.NetworkError):
         pass  # offline mode, internet down, etc. => try local files

     # check local files
@@ -199,7 +198,7 @@ def is_remote_url(url_or_filename):

 def define_sagemaker_information():
     try:
-        instance_data = requests.get(os.environ["ECS_CONTAINER_METADATA_URI"]).json()
+        instance_data = httpx.get(os.environ["ECS_CONTAINER_METADATA_URI"]).json()
         dlc_container_used = instance_data["Image"]
         dlc_tag = instance_data["Image"].split(":")[1]
     except Exception:
@@ -554,7 +553,7 @@ def cached_files(
                 ) from e
             # snapshot_download will not raise EntryNotFoundError, but hf_hub_download can. If this is the case, it will be treated
            # later on anyway and re-raised if needed
-            elif isinstance(e, HTTPError) and not isinstance(e, EntryNotFoundError):
+            elif isinstance(e, HfHubHTTPError) and not isinstance(e, EntryNotFoundError):
                 if not _raise_exceptions_for_connection_errors:
                     return None
                 raise OSError(f"There was a specific connection error when trying to load {path_or_repo_id}:\n{e}") from e
@@ -677,18 +676,13 @@ def has_file(
         response = get_session().head(
             hf_hub_url(path_or_repo, filename=filename, revision=revision, repo_type=repo_type),
             headers=build_hf_headers(token=token, user_agent=http_user_agent()),
-            allow_redirects=False,
-            proxies=proxies,
+            follow_redirects=False,
             timeout=10,
         )
-    except (requests.exceptions.SSLError, requests.exceptions.ProxyError):
+    except httpx.ProxyError:
         # Actually raise for those subclasses of ConnectionError
         raise
-    except (
-        requests.exceptions.ConnectionError,
-        requests.exceptions.Timeout,
-        OfflineModeIsEnabled,
-    ):
+    except (httpx.ConnectError, httpx.TimeoutException, OfflineModeIsEnabled):
         return has_file_in_cache

     try:
@@ -712,7 +706,7 @@ def has_file(
         ) from e
     except EntryNotFoundError:
         return False  # File does not exist
-    except requests.HTTPError:
+    except HfHubHTTPError:
         # Any authentication/authorization error will be caught here => default to cache
         return has_file_in_cache
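Note: `has_file` shows two further kwarg differences. requests' `allow_redirects` is spelled `follow_redirects` in httpx, and httpx accepts no per-request `proxies` argument, which is why that line is dropped rather than renamed: proxy routing moves to the client. A sketch, with a hypothetical proxy URL, and noting that the `proxy=` spelling assumes a recent httpx release:

import httpx

client = httpx.Client(proxy="http://localhost:3128", timeout=10)
response = client.head("https://huggingface.co", follow_redirects=False)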
diff --git a/src/transformers/video_utils.py b/src/transformers/video_utils.py
index 1ae8f59f9ae..30ad1f39f2c 100644
--- a/src/transformers/video_utils.py
+++ b/src/transformers/video_utils.py
@@ -22,8 +22,8 @@ from io import BytesIO
 from typing import Callable, NewType, Optional, Union
 from urllib.parse import urlparse

+import httpx
 import numpy as np
-import requests

 from .image_transforms import PaddingMode, to_channel_dimension_format
 from .image_utils import ChannelDimension, infer_channel_dimension_format, is_valid_image
@@ -683,7 +683,7 @@ def load_video(
         bytes_obj = buffer.getvalue()
         file_obj = BytesIO(bytes_obj)
     elif video.startswith("http://") or video.startswith("https://"):
-        file_obj = BytesIO(requests.get(video).content)
+        file_obj = BytesIO(httpx.get(video, follow_redirects=True).content)
     elif os.path.isfile(video):
         file_obj = video
     else:
diff --git a/tests/commands/test_serving.py b/tests/commands/test_serving.py
index 9fbd79464b1..e745dad3c88 100644
--- a/tests/commands/test_serving.py
+++ b/tests/commands/test_serving.py
@@ -19,7 +19,7 @@ from threading import Thread
 from unittest.mock import patch

 import aiohttp.client_exceptions
-import requests
+import httpx
 from huggingface_hub import AsyncInferenceClient, ChatCompletionStreamOutput
 from parameterized import parameterized
@@ -509,17 +509,18 @@ def _call_healthcheck(base_url: str):
     retries = 10
     while retries > 0:
         try:
-            response = requests.get(f"{base_url}/health")
+            response = httpx.get(f"{base_url}/health")
             break
-        except requests.exceptions.ConnectionError:
+        except httpx.NetworkError:
             time.sleep(0.1)
             retries -= 1
     return response

 def _open_stream_and_cancel(base_url: str, request_id: str):
-    with requests.Session() as s:
-        with s.post(
+    with httpx.Client() as s:
+        with s.stream(
+            "POST",
             f"{base_url}/v1/chat/completions",
             headers={"X-Request-ID": request_id},
             json={
@@ -527,13 +528,12 @@ def _open_stream_and_cancel(base_url: str, request_id: str):
                 "stream": True,
                 "messages": [{"role": "user", "content": "Count slowly so I can cancel you."}],
             },
-            stream=True,
             timeout=30,
         ) as resp:
             assert resp.status_code == 200

             wait_for_n_chunks = 3
-            for i, _ in enumerate(resp.iter_content(chunk_size=None)):
+            for i, _ in enumerate(resp.iter_bytes(chunk_size=None)):
                 if i >= wait_for_n_chunks:
                     resp.close()
                     break
diff --git a/tests/generation/test_configuration_utils.py b/tests/generation/test_configuration_utils.py
index bb4c2a52986..adfa1af09d5 100644
--- a/tests/generation/test_configuration_utils.py
+++ b/tests/generation/test_configuration_utils.py
@@ -19,7 +19,7 @@ import tempfile
 import unittest
 import warnings

-from huggingface_hub import HfFolder, create_pull_request
+from huggingface_hub import create_pull_request
 from parameterized import parameterized

 from transformers import AutoConfig, GenerationConfig, WatermarkingConfig, is_torch_available
@@ -688,7 +688,6 @@ class ConfigPushToHubTester(unittest.TestCase):
     @classmethod
     def setUpClass(cls):
         cls._token = TOKEN
-        HfFolder.save_token(TOKEN)

     def test_push_to_hub(self):
         with TemporaryHubRepo(token=self._token) as tmp_repo:
diff --git a/tests/models/auto/test_modeling_auto.py b/tests/models/auto/test_modeling_auto.py
index 352df1fe7b5..9babbd42e05 100644
--- a/tests/models/auto/test_modeling_auto.py
+++ b/tests/models/auto/test_modeling_auto.py
@@ -13,9 +13,6 @@
 # limitations under the License.

 import copy
-import os
-import os.path
-import shutil
 import sys
 import tempfile
 import unittest
@@ -23,7 +20,6 @@ from collections import OrderedDict
 from pathlib import Path

 import pytest
-from huggingface_hub import Repository

 import transformers
 from transformers import BertConfig, GPT2Model, is_safetensors_available, is_torch_available
@@ -42,7 +38,6 @@ from ..bert.test_modeling_bert import BertModelTester
 sys.path.append(str(Path(__file__).parent.parent.parent.parent / "utils"))

 from test_module.custom_configuration import CustomConfig  # noqa E402
-from utils.fetch_hub_objects_for_ci import url_to_local_path

 if is_torch_available():
@@ -562,26 +557,6 @@ class AutoModelTest(unittest.TestCase):
         _MODEL_MAPPING = _LazyAutoMapping(_CONFIG_MAPPING_NAMES, _MODEL_MAPPING_NAMES)
         self.assertEqual(_MODEL_MAPPING[BertConfig], GPT2Model)

-    def test_dynamic_saving_from_local_repo(self):
-        with tempfile.TemporaryDirectory() as tmp_dir, tempfile.TemporaryDirectory() as tmp_dir_out:
-            # `Repository` is deprecated and will be removed in `huggingface_hub v1.0`.
-            # TODO: Remove this test when this comes.
-            # Here is a ugly approach to avoid `too many requests`
-            repo_id = url_to_local_path("hf-internal-testing/tiny-random-custom-architecture")
-            if os.path.isdir(repo_id):
-                shutil.copytree(repo_id, tmp_dir, dirs_exist_ok=True)
-            else:
-                _ = Repository(
-                    local_dir=tmp_dir,
-                    clone_from=url_to_local_path("hf-internal-testing/tiny-random-custom-architecture"),
-                )
-
-            model = AutoModelForCausalLM.from_pretrained(tmp_dir, trust_remote_code=True)
-            model.save_pretrained(tmp_dir_out)
-            _ = AutoModelForCausalLM.from_pretrained(tmp_dir_out, trust_remote_code=True)
-            self.assertTrue((Path(tmp_dir_out) / "modeling_fake_custom.py").is_file())
-            self.assertTrue((Path(tmp_dir_out) / "configuration_fake_custom.py").is_file())
-
     def test_custom_model_patched_generation_inheritance(self):
         """
         Tests that our inheritance patching for generate-compatible models works as expected. Without this feature,
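Note: `huggingface_hub.Repository` (git-clone based) is removed in v1.0, which is why the Repository-dependent test above is deleted outright. Where repo files are still needed on disk, the HTTP-based replacement used throughout the rest of this diff is `snapshot_download`; a minimal sketch:

import tempfile

from huggingface_hub import snapshot_download

# Repository(local_dir=..., clone_from=...) cloned via git; snapshot_download
# materializes the same files over HTTP, with no git checkout.
with tempfile.TemporaryDirectory() as tmp_dir:
    snapshot_download("hf-internal-testing/tiny-random-custom-architecture", local_dir=tmp_dir)
    # tmp_dir now holds the repo files, ready for from_pretrained(tmp_dir)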
diff --git a/tests/models/auto/test_processor_auto.py b/tests/models/auto/test_processor_auto.py
index 60500001a3b..6eabd690eed 100644
--- a/tests/models/auto/test_processor_auto.py
+++ b/tests/models/auto/test_processor_auto.py
@@ -20,7 +20,7 @@ import unittest
 from pathlib import Path
 from shutil import copyfile

-from huggingface_hub import HfFolder, Repository
+from huggingface_hub import snapshot_download, upload_folder

 import transformers
 from transformers import (
@@ -423,7 +423,6 @@ class ProcessorPushToHubTester(unittest.TestCase):
     @classmethod
     def setUpClass(cls):
         cls._token = TOKEN
-        HfFolder.save_token(TOKEN)

     def test_push_to_hub_via_save_pretrained(self):
         with TemporaryHubRepo(token=self._token) as tmp_repo:
@@ -471,7 +470,7 @@ class ProcessorPushToHubTester(unittest.TestCase):
             processor = CustomProcessor(feature_extractor, tokenizer)

             with tempfile.TemporaryDirectory() as tmp_dir:
-                repo = Repository(tmp_dir, clone_from=tmp_repo, token=self._token)
+                snapshot_download(tmp_repo.repo_id, token=self._token)
                 processor.save_pretrained(tmp_dir)

                 # This has added the proper auto_map field to the feature extractor config
@@ -499,7 +498,7 @@ class ProcessorPushToHubTester(unittest.TestCase):
                 self.assertTrue(os.path.isfile(os.path.join(tmp_dir, "custom_tokenization.py")))
                 self.assertTrue(os.path.isfile(os.path.join(tmp_dir, "custom_processing.py")))

-                repo.push_to_hub()
+                upload_folder(repo_id=tmp_repo.repo_id, folder_path=tmp_dir, token=self._token)

                 new_processor = AutoProcessor.from_pretrained(tmp_repo.repo_id, trust_remote_code=True)
                 # Can't make an isinstance check because the new_processor is from the CustomProcessor class of a dynamic module
diff --git a/tests/pipelines/test_pipelines_common.py b/tests/pipelines/test_pipelines_common.py
index aa3b1b55beb..eaf47ad8f52 100644
--- a/tests/pipelines/test_pipelines_common.py
+++ b/tests/pipelines/test_pipelines_common.py
@@ -21,8 +21,8 @@ import unittest
 from pathlib import Path

 import datasets
-from huggingface_hub import HfFolder, Repository, delete_repo
-from requests.exceptions import HTTPError
+from huggingface_hub import delete_repo, snapshot_download
+from huggingface_hub.errors import HfHubHTTPError

 from transformers import (
     AutomaticSpeechRecognitionPipeline,
@@ -209,7 +209,7 @@ class CommonPipelineTest(unittest.TestCase):
     @require_torch
     def test_auto_model_pipeline_registration_from_local_dir(self):
         with tempfile.TemporaryDirectory() as tmp_dir:
-            _ = Repository(local_dir=tmp_dir, clone_from="hf-internal-testing/tiny-random-custom-architecture")
+            snapshot_download("hf-internal-testing/tiny-random-custom-architecture", local_dir=tmp_dir)

             pipe = pipeline("text-generation", tmp_dir, trust_remote_code=True)
             self.assertIsInstance(pipe, TextGenerationPipeline)  # Assert successful load
@@ -874,13 +874,12 @@ class DynamicPipelineTester(unittest.TestCase):
     @classmethod
     def setUpClass(cls):
         cls._token = TOKEN
-        HfFolder.save_token(TOKEN)

     @classmethod
     def tearDownClass(cls):
         try:
             delete_repo(token=cls._token, repo_id="test-dynamic-pipeline")
-        except HTTPError:
+        except HfHubHTTPError:
             pass

     @unittest.skip("Broken, TODO @Yih-Dar")
diff --git a/tests/pipelines/test_pipelines_image_segmentation.py b/tests/pipelines/test_pipelines_image_segmentation.py
index b1f0dd14057..c926dd004f3 100644
--- a/tests/pipelines/test_pipelines_image_segmentation.py
+++ b/tests/pipelines/test_pipelines_image_segmentation.py
@@ -11,13 +11,13 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-
+import io
 import tempfile
 import unittest

 import datasets
+import httpx
 import numpy as np
-import requests
 from datasets import load_dataset
 from huggingface_hub import ImageSegmentationOutputElement
 from huggingface_hub.utils import insecure_hashlib
@@ -318,7 +318,9 @@ class ImageSegmentationPipelineTests(unittest.TestCase):
         ]

         # actual links to get files
         expected_masks = [x.replace("/blob/", "/resolve/") for x in expected_masks]
-        expected_masks = [Image.open(requests.get(image, stream=True).raw) for image in expected_masks]
+        expected_masks = [
+            Image.open(io.BytesIO(httpx.get(image, follow_redirects=True).content)) for image in expected_masks
+        ]

         # Convert masks to numpy array
         output_masks = [np.array(x) for x in output_masks]
diff --git a/tests/pipelines/test_pipelines_image_to_text.py b/tests/pipelines/test_pipelines_image_to_text.py
index bc8ac76548e..5ba99695d65 100644
--- a/tests/pipelines/test_pipelines_image_to_text.py
+++ b/tests/pipelines/test_pipelines_image_to_text.py
@@ -11,10 +11,10 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-
+import io
 import unittest

-import requests
+import httpx

 from transformers import MODEL_FOR_VISION_2_SEQ_MAPPING, is_vision_available
 from transformers.pipelines import ImageToTextPipeline, pipeline
@@ -172,7 +172,7 @@ class ImageToTextPipelineTests(unittest.TestCase):
     def test_generation_pt_blip(self):
         pipe = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base")
         url = "https://huggingface.co/datasets/sayakpaul/sample-datasets/resolve/main/pokemon.png"
-        image = Image.open(requests.get(url, stream=True).raw)
+        image = Image.open(io.BytesIO(httpx.get(url, follow_redirects=True).content))

         outputs = pipe(image)
         self.assertEqual(outputs, [{"generated_text": "a pink pokemon pokemon with a blue shirt and a blue shirt"}])
@@ -182,7 +182,7 @@ class ImageToTextPipelineTests(unittest.TestCase):
     def test_generation_pt_git(self):
         pipe = pipeline("image-to-text", model="microsoft/git-base-coco")
         url = "https://huggingface.co/datasets/sayakpaul/sample-datasets/resolve/main/pokemon.png"
-        image = Image.open(requests.get(url, stream=True).raw)
+        image = Image.open(io.BytesIO(httpx.get(url, follow_redirects=True).content))

         outputs = pipe(image)
         self.assertEqual(outputs, [{"generated_text": "a cartoon of a purple character."}])
@@ -192,7 +192,7 @@ class ImageToTextPipelineTests(unittest.TestCase):
     def test_conditional_generation_pt_blip(self):
         pipe = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base")
         url = "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/transformers/tasks/ai2d-demo.jpg"
-        image = Image.open(requests.get(url, stream=True).raw)
+        image = Image.open(io.BytesIO(httpx.get(url, follow_redirects=True).content))

         prompt = "a photography of"
@@ -207,7 +207,7 @@ class ImageToTextPipelineTests(unittest.TestCase):
     def test_conditional_generation_pt_git(self):
         pipe = pipeline("image-to-text", model="microsoft/git-base-coco")
         url = "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/transformers/tasks/ai2d-demo.jpg"
-        image = Image.open(requests.get(url, stream=True).raw)
+        image = Image.open(io.BytesIO(httpx.get(url, follow_redirects=True).content))

         prompt = "a photo of a"
@@ -222,7 +222,7 @@ class ImageToTextPipelineTests(unittest.TestCase):
     def test_conditional_generation_pt_pix2struct(self):
         pipe = pipeline("image-to-text", model="google/pix2struct-ai2d-base")
         url = "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/transformers/tasks/ai2d-demo.jpg"
-        image = Image.open(requests.get(url, stream=True).raw)
+        image = Image.open(io.BytesIO(httpx.get(url, follow_redirects=True).content))

         prompt = "What does the label 15 represent? (1) lava (2) core (3) tunnel (4) ash cloud"
diff --git a/tests/test_image_processing_common.py b/tests/test_image_processing_common.py
index ce0bd4181be..e7c3daa1a38 100644
--- a/tests/test_image_processing_common.py
+++ b/tests/test_image_processing_common.py
@@ -11,8 +11,8 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-
 import inspect
+import io
 import json
 import os
 import pathlib
@@ -22,9 +22,9 @@ import unittest
 import warnings
 from copy import deepcopy

+import httpx
 import numpy as np
 import pytest
-import requests
 from packaging import version

 from transformers import AutoImageProcessor, BatchFeature
@@ -182,7 +182,9 @@ class ImageProcessingTestMixin:
             self.skipTest(reason="Skipping slow/fast equivalence test as one of the image processors is not defined")

         dummy_image = Image.open(
-            requests.get("http://images.cocodataset.org/val2017/000000039769.jpg", stream=True).raw
+            io.BytesIO(
+                httpx.get("http://images.cocodataset.org/val2017/000000039769.jpg", follow_redirects=True).content
+            )
         )
         image_processor_slow = self.image_processing_class(**self.image_processor_dict)
         image_processor_fast = self.fast_image_processing_class(**self.image_processor_dict)
diff --git a/tests/test_tokenization_mistral_common.py b/tests/test_tokenization_mistral_common.py
index 05b9ae636fb..e3408317758 100644
--- a/tests/test_tokenization_mistral_common.py
+++ b/tests/test_tokenization_mistral_common.py
@@ -34,7 +34,7 @@ if is_mistral_common_available():
     from mistral_common.tokens.tokenizers.mistral import MistralTokenizer
     from mistral_common.tokens.tokenizers.utils import list_local_hf_repo_files

-    # To avoid unnecessary `requests.get` calls which give us `Error: Too Many Requests for url` on CircleCI
+    # To avoid unnecessary `httpx.get` calls which give us `Error: Too Many Requests for url` on CircleCI
     mistral_common.tokens.tokenizers.image.download_image = load_image
diff --git a/tests/trainer/test_trainer.py b/tests/trainer/test_trainer.py
index 29558f50bba..5cce980a6a0 100644
--- a/tests/trainer/test_trainer.py
+++ b/tests/trainer/test_trainer.py
@@ -32,7 +32,7 @@ from unittest.mock import Mock, patch

 import numpy as np
 import pytest
-from huggingface_hub import HfFolder, ModelCard, create_branch, list_repo_commits, list_repo_files
+from huggingface_hub import ModelCard, create_branch, list_repo_commits, list_repo_files
 from packaging import version
 from parameterized import parameterized
@@ -5284,7 +5284,6 @@ class TrainerIntegrationWithHubTester(unittest.TestCase):
     @classmethod
     def setUpClass(cls):
         cls._token = TOKEN
-        HfFolder.save_token(TOKEN)

     def test_push_to_hub(self):
         with TemporaryHubRepo(token=self._token) as tmp_repo:
@@ -5469,14 +5468,10 @@ class TrainerIntegrationWithHubTester(unittest.TestCase):
         )
         branch = "v1.0"
         create_branch(repo_id=trainer.hub_model_id, branch=branch, token=self._token, exist_ok=True)
-        url = trainer.push_to_hub(revision=branch)
+        push_commit = trainer.push_to_hub(revision=branch)

-        # Extract branch from the url
-        re_search = re.search(r"tree/([^/]+)/", url)
-        self.assertIsNotNone(re_search)
-
-        branch_name = re_search.groups()[0]
-        self.assertEqual(branch_name, branch)
+        commits = list_repo_commits(repo_id=trainer.hub_model_id, revision=branch, token=self._token)
+        self.assertEqual(commits[0].commit_id, push_commit.oid)

 @require_torch
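Note: with `Trainer.push_to_hub` now returning a `CommitInfo` instead of a `str` (see the trainer.py hunk earlier), the test stops regex-parsing a `tree/<branch>/` URL and compares commit hashes instead. A small sketch of the fields relied on here:

from huggingface_hub import CommitInfo

def describe(commit: CommitInfo) -> str:
    # `oid` is the commit hash the updated test compares against
    # list_repo_commits(); `commit_url` is the human-readable link.
    return f"{commit.oid}: {commit.commit_url}"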
diff --git a/tests/utils/test_configuration_utils.py b/tests/utils/test_configuration_utils.py
index 50b5b11db1b..069ca6729bb 100644
--- a/tests/utils/test_configuration_utils.py
+++ b/tests/utils/test_configuration_utils.py
@@ -21,8 +21,7 @@ import unittest.mock as mock
 import warnings
 from pathlib import Path

-from huggingface_hub import HfFolder
-from requests.exceptions import HTTPError
+import httpx

 from transformers import AutoConfig, BertConfig, Florence2Config, GPT2Config
 from transformers.configuration_utils import PretrainedConfig
@@ -93,7 +92,6 @@ class ConfigPushToHubTester(unittest.TestCase):
     @classmethod
     def setUpClass(cls):
         cls._token = TOKEN
-        HfFolder.save_token(TOKEN)

     def test_push_to_hub(self):
         with TemporaryHubRepo(token=self._token) as tmp_repo:
@@ -222,14 +220,16 @@ class ConfigTestUtils(unittest.TestCase):
         response_mock = mock.Mock()
         response_mock.status_code = 500
         response_mock.headers = {}
-        response_mock.raise_for_status.side_effect = HTTPError
+        response_mock.raise_for_status.side_effect = httpx.HTTPStatusError(
+            "failed", request=mock.Mock(), response=mock.Mock()
+        )
         response_mock.json.return_value = {}

         # Download this model to make sure it's in the cache.
         _ = BertConfig.from_pretrained("hf-internal-testing/tiny-random-bert")

         # Under the mock environment we get a 500 error when trying to reach the model.
-        with mock.patch("requests.Session.request", return_value=response_mock) as mock_head:
+        with mock.patch("httpx.Client.request", return_value=response_mock) as mock_head:
             _ = BertConfig.from_pretrained("hf-internal-testing/tiny-random-bert")
             # This check we did call the fake head request
             mock_head.assert_called()
diff --git a/tests/utils/test_feature_extraction_utils.py b/tests/utils/test_feature_extraction_utils.py
index b3d8932e7cd..b0a6a193d10 100644
--- a/tests/utils/test_feature_extraction_utils.py
+++ b/tests/utils/test_feature_extraction_utils.py
@@ -19,8 +19,7 @@ import unittest
 import unittest.mock as mock
 from pathlib import Path

-from huggingface_hub import HfFolder
-from requests.exceptions import HTTPError
+import httpx

 from transformers import AutoFeatureExtractor, Wav2Vec2FeatureExtractor
 from transformers.testing_utils import TOKEN, TemporaryHubRepo, get_tests_dir, is_staging_test
@@ -40,13 +39,15 @@ class FeatureExtractorUtilTester(unittest.TestCase):
         response_mock = mock.Mock()
         response_mock.status_code = 500
         response_mock.headers = {}
-        response_mock.raise_for_status.side_effect = HTTPError
+        response_mock.raise_for_status.side_effect = httpx.HTTPStatusError(
+            "failed", request=mock.Mock(), response=mock.Mock()
+        )
         response_mock.json.return_value = {}

         # Download this model to make sure it's in the cache.
         _ = Wav2Vec2FeatureExtractor.from_pretrained("hf-internal-testing/tiny-random-wav2vec2")

         # Under the mock environment we get a 500 error when trying to reach the model.
-        with mock.patch("requests.Session.request", return_value=response_mock) as mock_head:
+        with mock.patch("httpx.Client.request", return_value=response_mock) as mock_head:
             _ = Wav2Vec2FeatureExtractor.from_pretrained("hf-internal-testing/tiny-random-wav2vec2")
             # This check we did call the fake head request
             mock_head.assert_called()
@@ -57,7 +58,6 @@ class FeatureExtractorPushToHubTester(unittest.TestCase):
     @classmethod
     def setUpClass(cls):
         cls._token = TOKEN
-        HfFolder.save_token(TOKEN)

     def test_push_to_hub(self):
         with TemporaryHubRepo(token=self._token) as tmp_repo:
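Note: unlike requests' `HTTPError`, `httpx.HTTPStatusError` cannot be raised bare; its constructor requires `request=` and `response=`, which is why these mocks set a pre-built instance as `side_effect` instead of the class. The same error can also be produced without `unittest.mock` from a real response object (URL illustrative):

import httpx

request = httpx.Request("HEAD", "https://huggingface.co/api/models/any-model")
response = httpx.Response(500, request=request)
try:
    response.raise_for_status()
except httpx.HTTPStatusError as err:
    print(err.response.status_code)  # 500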
diff --git a/tests/utils/test_hub_utils.py b/tests/utils/test_hub_utils.py
index df3af3d97a8..a3423245a89 100644
--- a/tests/utils/test_hub_utils.py
+++ b/tests/utils/test_hub_utils.py
@@ -19,8 +19,7 @@ import unittest.mock as mock
 from pathlib import Path

 from huggingface_hub import hf_hub_download
-from huggingface_hub.errors import LocalEntryNotFoundError, OfflineModeIsEnabled
-from requests.exceptions import HTTPError
+from huggingface_hub.errors import HfHubHTTPError, LocalEntryNotFoundError, OfflineModeIsEnabled

 from transformers.utils import (
     CONFIG_NAME,
@@ -87,7 +86,10 @@ class GetFromCacheTests(unittest.TestCase):
         self.assertIsNone(path)

         # Under the mock environment, hf_hub_download will always raise an HTTPError
-        with mock.patch("transformers.utils.hub.hf_hub_download", side_effect=HTTPError) as mock_head:
+        with mock.patch(
+            "transformers.utils.hub.hf_hub_download",
+            side_effect=HfHubHTTPError("failed", response=mock.Mock(status_code=404)),
+        ) as mock_head:
             path = cached_file(RANDOM_BERT, "conf", _raise_exceptions_for_connection_errors=False)
             self.assertIsNone(path)
             # This check we did call the fake head request
diff --git a/tests/utils/test_image_processing_utils.py b/tests/utils/test_image_processing_utils.py
index ea8c06fa993..17e5e305c61 100644
--- a/tests/utils/test_image_processing_utils.py
+++ b/tests/utils/test_image_processing_utils.py
@@ -18,8 +18,7 @@ import unittest
 import unittest.mock as mock
 from pathlib import Path

-from huggingface_hub import HfFolder
-from requests.exceptions import HTTPError
+import httpx

 from transformers import AutoImageProcessor, ViTImageProcessor, ViTImageProcessorFast
 from transformers.image_processing_utils import get_size_dict
@@ -40,7 +39,9 @@ class ImageProcessorUtilTester(unittest.TestCase):
         response_mock = mock.Mock()
         response_mock.status_code = 500
         response_mock.headers = {}
-        response_mock.raise_for_status.side_effect = HTTPError
+        response_mock.raise_for_status.side_effect = httpx.HTTPStatusError(
+            "failed", request=mock.Mock(), response=mock.Mock()
+        )
         response_mock.json.return_value = {}

         # Download this model to make sure it's in the cache.
@@ -48,7 +49,7 @@ class ImageProcessorUtilTester(unittest.TestCase):
         _ = ViTImageProcessor.from_pretrained("hf-internal-testing/tiny-random-vit")
         _ = ViTImageProcessorFast.from_pretrained("hf-internal-testing/tiny-random-vit")

         # Under the mock environment we get a 500 error when trying to reach the model.
-        with mock.patch("requests.Session.request", return_value=response_mock) as mock_head:
+        with mock.patch("httpx.Client.request", return_value=response_mock) as mock_head:
             _ = ViTImageProcessor.from_pretrained("hf-internal-testing/tiny-random-vit")
             _ = ViTImageProcessorFast.from_pretrained("hf-internal-testing/tiny-random-vit")
             # This check we did call the fake head request
@@ -71,7 +72,6 @@ class ImageProcessorPushToHubTester(unittest.TestCase):
     @classmethod
     def setUpClass(cls):
         cls._token = TOKEN
-        HfFolder.save_token(TOKEN)

     def test_push_to_hub(self):
         with TemporaryHubRepo(token=self._token) as tmp_repo:
diff --git a/tests/utils/test_image_utils.py b/tests/utils/test_image_utils.py
index 8d124d361c2..6c2db861ffe 100644
--- a/tests/utils/test_image_utils.py
+++ b/tests/utils/test_image_utils.py
@@ -19,11 +19,10 @@ import unittest
 from io import BytesIO
 from typing import Optional

+import httpx
 import numpy as np
 import pytest
-import requests
 from huggingface_hub.file_download import hf_hub_url, http_get
-from requests import ConnectTimeout, ReadTimeout

 from tests.pipelines.test_pipelines_document_question_answering import INVOICE_URL
 from transformers import is_torch_available, is_vision_available
@@ -49,7 +48,7 @@ if is_vision_available():

 def get_image_from_hub_dataset(dataset_id: str, filename: str, revision: Optional[str] = None) -> "PIL.Image.Image":
     url = hf_hub_url(dataset_id, filename, repo_type="dataset", revision=revision)
-    return PIL.Image.open(BytesIO(requests.get(url).content))
+    return PIL.Image.open(BytesIO(httpx.get(url, follow_redirects=True).content))

 def get_random_image(height, width):
@@ -727,7 +726,7 @@ class LoadImageTester(unittest.TestCase):

     @is_flaky()
     def test_load_img_url_timeout(self):
-        with self.assertRaises((ReadTimeout, ConnectTimeout)):
+        with self.assertRaises(httpx.ConnectTimeout):
             load_image(INVOICE_URL, timeout=0.001)

     def test_load_img_local(self):
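Note: the timeout test now expects only `httpx.ConnectTimeout` because a bare float such as `timeout=0.001` bounds every phase (connect, read, write, pool acquire) and the connect phase trips first. Phases can be bounded separately when finer control is needed; a sketch:

import httpx

timeout = httpx.Timeout(10.0, connect=2.0)  # 10s default for all phases, 2s to connect
response = httpx.get("https://huggingface.co", timeout=timeout, follow_redirects=True)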
diff --git a/tests/utils/test_modeling_utils.py b/tests/utils/test_modeling_utils.py
index fc2bbb60c45..045f1104078 100644
--- a/tests/utils/test_modeling_utils.py
+++ b/tests/utils/test_modeling_utils.py
@@ -27,12 +27,11 @@ import uuid
 import warnings
 from pathlib import Path

+import httpx
 import pytest
-import requests
-from huggingface_hub import HfApi, HfFolder, split_torch_state_dict_into_shards
+from huggingface_hub import HfApi, split_torch_state_dict_into_shards
 from parameterized import parameterized
 from pytest import mark
-from requests.exceptions import HTTPError

 from transformers import (
     AutoConfig,
@@ -419,7 +418,7 @@ class ModelUtilsTest(TestCasePlus):
             # First attempt will fail with a connection error
             if not hasattr(test_func, "attempt"):
                 test_func.attempt = 1
-                raise requests.exceptions.ConnectionError("Connection failed")
+                raise httpx.ConnectError("Connection failed")
             # Second attempt will succeed
             return True
@@ -1172,14 +1171,16 @@ class ModelUtilsTest(TestCasePlus):
         response_mock = mock.Mock()
         response_mock.status_code = 500
         response_mock.headers = {}
-        response_mock.raise_for_status.side_effect = HTTPError
+        response_mock.raise_for_status.side_effect = httpx.HTTPStatusError(
+            "failed", request=mock.Mock(), response=mock.Mock()
+        )
         response_mock.json.return_value = {}

         # Download this model to make sure it's in the cache.
         _ = BertModel.from_pretrained("hf-internal-testing/tiny-random-bert")

         # Under the mock environment we get a 500 error when trying to reach the model.
-        with mock.patch("requests.Session.request", return_value=response_mock) as mock_head:
+        with mock.patch("httpx.Client.request", return_value=response_mock) as mock_head:
             _ = BertModel.from_pretrained("hf-internal-testing/tiny-random-bert")
             # This check we did call the fake head request
             mock_head.assert_called()
@@ -2205,10 +2206,7 @@ class ModelOnTheFlyConversionTester(unittest.TestCase):
         initial_model = BertModel(config)

         initial_model.push_to_hub(self.repo_name, token=self.token, safe_serialization=False)
-        headers = {"Authorization": f"Bearer {self.token}"}
-        requests.put(
-            f"https://huggingface.co/api/models/{self.repo_name}/settings", json={"gated": "auto"}, headers=headers
-        )
+        self.api.update_repo_settings(self.repo_name, gated="auto")
         converted_model = BertModel.from_pretrained(self.repo_name, use_safetensors=True, token=self.token)

         with self.subTest("Initial and converted models are equal"):
@@ -2269,7 +2267,7 @@ class ModelOnTheFlyConversionTester(unittest.TestCase):
         initial_model.push_to_hub(self.repo_name, token=self.token, max_shard_size="200kb", safe_serialization=False)

         headers = {"Authorization": f"Bearer {self.token}"}
-        requests.put(
+        httpx.put(
             f"https://huggingface.co/api/models/{self.repo_name}/settings", json={"gated": "auto"}, headers=headers
         )
         converted_model = BertModel.from_pretrained(self.repo_name, use_safetensors=True, token=self.token)
@@ -2368,7 +2366,7 @@ class ModelOnTheFlyConversionTester(unittest.TestCase):

     @mock.patch("transformers.safetensors_conversion.spawn_conversion")
     def test_absence_of_safetensors_triggers_conversion_failed(self, spawn_conversion_mock):
-        spawn_conversion_mock.side_effect = HTTPError()
+        spawn_conversion_mock.side_effect = httpx.HTTPError("failed")

         config = BertConfig(
             vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
@@ -2388,7 +2386,6 @@ class ModelPushToHubTester(unittest.TestCase):
     @classmethod
     def setUpClass(cls):
         cls._token = TOKEN
-        HfFolder.save_token(TOKEN)

     @unittest.skip(reason="This test is flaky")
     def test_push_to_hub(self):
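Note: the first gating call site above now goes through the typed client instead of a hand-built authenticated PUT; the second call site keeps a raw `httpx.put` against the same endpoint and could presumably be unified the same way. The wrapper usage, with illustrative repo id and token:

from huggingface_hub import HfApi

api = HfApi(token="hf_xxx")
api.update_repo_settings("username/my-model", gated="auto")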
diff --git a/tests/utils/test_tokenization_utils.py b/tests/utils/test_tokenization_utils.py
index ff0f6499fe1..ecda49fd9bd 100644
--- a/tests/utils/test_tokenization_utils.py
+++ b/tests/utils/test_tokenization_utils.py
@@ -19,9 +19,8 @@ import unittest
 import unittest.mock as mock
 from pathlib import Path

-from huggingface_hub import HfFolder
+import httpx
 from huggingface_hub.file_download import http_get
-from requests.exceptions import HTTPError

 from transformers import (
     AlbertTokenizer,
@@ -50,14 +49,16 @@ class TokenizerUtilTester(unittest.TestCase):
         response_mock = mock.Mock()
         response_mock.status_code = 500
         response_mock.headers = {}
-        response_mock.raise_for_status.side_effect = HTTPError
+        response_mock.raise_for_status.side_effect = httpx.HTTPStatusError(
+            "failed", request=mock.Mock(), response=mock.Mock()
+        )
         response_mock.json.return_value = {}

         # Download this model to make sure it's in the cache.
         _ = BertTokenizer.from_pretrained("hf-internal-testing/tiny-random-bert")

         # Under the mock environment we get a 500 error when trying to reach the tokenizer.
-        with mock.patch("requests.Session.request", return_value=response_mock) as mock_head:
+        with mock.patch("httpx.Client.request", return_value=response_mock) as mock_head:
             _ = BertTokenizer.from_pretrained("hf-internal-testing/tiny-random-bert")
             # This check we did call the fake head request
             mock_head.assert_called()
@@ -68,14 +69,16 @@ class TokenizerUtilTester(unittest.TestCase):
         response_mock = mock.Mock()
         response_mock.status_code = 500
         response_mock.headers = {}
-        response_mock.raise_for_status.side_effect = HTTPError
+        response_mock.raise_for_status.side_effect = httpx.HTTPStatusError(
+            "failed", request=mock.Mock(), response=mock.Mock()
+        )
         response_mock.json.return_value = {}

         # Download this model to make sure it's in the cache.
         _ = GPT2TokenizerFast.from_pretrained("openai-community/gpt2")

         # Under the mock environment we get a 500 error when trying to reach the tokenizer.
-        with mock.patch("requests.Session.request", return_value=response_mock) as mock_head:
+        with mock.patch("httpx.Client.request", return_value=response_mock) as mock_head:
             _ = GPT2TokenizerFast.from_pretrained("openai-community/gpt2")
             # This check we did call the fake head request
             mock_head.assert_called()
@@ -115,7 +118,6 @@ class TokenizerPushToHubTester(unittest.TestCase):
     @classmethod
     def setUpClass(cls):
         cls._token = TOKEN
-        HfFolder.save_token(TOKEN)

     def test_push_to_hub(self):
         with TemporaryHubRepo(token=self._token) as tmp_repo:
diff --git a/utils/create_dummy_models.py b/utils/create_dummy_models.py
index a561967fba1..1e5c67bb909 100644
--- a/utils/create_dummy_models.py
+++ b/utils/create_dummy_models.py
@@ -28,7 +28,7 @@ from pathlib import Path
 from check_config_docstrings import get_checkpoint_from_config_class
 from datasets import load_dataset
 from get_test_info import get_model_to_tester_mapping, get_tester_classes_for_model
-from huggingface_hub import Repository, create_repo, hf_api, upload_folder
+from huggingface_hub import Repository, create_repo, hf_api, upload_folder  # TODO: remove Repository

 from transformers import (
     CONFIG_MAPPING,
diff --git a/utils/fetch_hub_objects_for_ci.py b/utils/fetch_hub_objects_for_ci.py
index 349fd8ed58c..0f41ec344f5 100644
--- a/utils/fetch_hub_objects_for_ci.py
+++ b/utils/fetch_hub_objects_for_ci.py
@@ -1,7 +1,7 @@
 import os

 import requests
-from huggingface_hub import Repository, hf_hub_download
+from huggingface_hub import hf_hub_download, snapshot_download

 from transformers.testing_utils import _run_pipeline_tests, _run_staging
 from transformers.utils.import_utils import is_mistral_common_available
@@ -173,9 +173,9 @@ if __name__ == "__main__":
         # But this repo. is never used in a test decorated by `is_staging_test`.
         if not _run_staging:
             if not os.path.isdir("tiny-random-custom-architecture"):
-                _ = Repository(
+                snapshot_download(
+                    "hf-internal-testing/tiny-random-custom-architecture",
                     local_dir="tiny-random-custom-architecture",
-                    clone_from="hf-internal-testing/tiny-random-custom-architecture",
                 )

     # For `tests/test_tokenization_mistral_common.py:TestMistralCommonTokenizer`, which eventually calls
diff --git a/utils/update_tiny_models.py b/utils/update_tiny_models.py
index ee81407d412..336770c540e 100644
--- a/utils/update_tiny_models.py
+++ b/utils/update_tiny_models.py
@@ -27,7 +27,7 @@ import os
 import time

 from create_dummy_models import COMPOSITE_MODELS, create_tiny_models
-from huggingface_hub import ModelFilter, hf_api
+from huggingface_hub import HfApi

 import transformers
 from transformers import AutoFeatureExtractor, AutoImageProcessor, AutoTokenizer
@@ -65,15 +65,12 @@ def get_tiny_model_names_from_repo():

 def get_tiny_model_summary_from_hub(output_path):
+    api = HfApi()
     special_models = COMPOSITE_MODELS.values()

     # All tiny model base names on Hub
     model_names = get_all_model_names()
-    models = hf_api.list_models(
-        filter=ModelFilter(
-            author="hf-internal-testing",
-        )
-    )
+    models = api.list_models(author="hf-internal-testing")
     _models = set()
     for x in models:
         model = x.id
@@ -94,7 +91,7 @@ def get_tiny_model_summary_from_hub(output_path):
             repo_id = f"hf-internal-testing/tiny-random-{model}"
             model = model.split("-")[0]
             try:
-                repo_info = hf_api.repo_info(repo_id)
+                repo_info = api.repo_info(repo_id)
                 content = {
                     "tokenizer_classes": set(),
                     "processor_classes": set(),
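Note: `ModelFilter` no longer exists in huggingface_hub v1.0; `list_models` takes the filter criteria as keyword arguments and returns a lazy iterator of `ModelInfo` objects, so the `for x in models` loop above keeps working unchanged. A sketch:

from huggingface_hub import HfApi

api = HfApi()
for model in api.list_models(author="hf-internal-testing", limit=5):
    print(model.id)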