Commit 90516ca

Merge branch 'main' into docs/vector_search_with_hub_as_backend

2 parents 9c0ce48 + 9318e2e

File tree: 59 files changed, +113120 −8863 lines


.gitignore

Lines changed: 1 addition & 0 deletions
@@ -1,6 +1,7 @@
 .vscode
 .idea/
 .venv/
+.env
 
 **/.ipynb_checkpoints
 **/.DS_Store
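
Side note on the new rule: the notebooks touched by this commit read `HUGGINGFACEHUB_API_TOKEN` from the environment, and ignoring `.env` lets contributors keep that token in a local file without risking a commit. A minimal sketch of the pattern, assuming the `python-dotenv` package and a hypothetical local `.env` file (neither is added by this commit):

```python
# .env (ignored by git) would contain:  HUGGINGFACEHUB_API_TOKEN=hf_...
import os

from dotenv import load_dotenv  # pip install python-dotenv
from huggingface_hub import login

load_dotenv()  # copies key=value pairs from .env into os.environ
login(os.getenv("HUGGINGFACEHUB_API_TOKEN"))
```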

notebooks/en/_toctree.yml

Lines changed: 19 additions & 1 deletion
@@ -54,6 +54,8 @@
       title: Building RAG with Custom Unstructured Data
     - local: fine_tuning_llm_to_generate_persian_product_catalogs_in_json_format
       title: Fine-tuning LLM to Generate Persian Product Catalogs in JSON Format
+    - local: finetune_t5_for_search_tag_generation
+      title: Fine-tuning T5 for Automatic GitHub Tag Generation with PEFT
     - local: llm_gateway_pii_detection
       title: LLM Gateway for PII Detection
     - local: information_extraction_haystack_nuextract
@@ -76,8 +78,18 @@
       title: Scaling Test-Time Compute for Longer Thinking in LLMs
     - local: fine_tuning_llm_grpo_trl
       title: Post training an LLM for reasoning with GRPO in TRL
-    - local: medical_rag_and_Reasoning
+    - local: trl_grpo_reasoning_advanced_reward
+      title: TRL GRPO Reasoning with Advanced Reward
+    - local: medical_rag_and_reasoning
       title: HuatuoGPT-o1 Medical RAG and Reasoning
+    - local: fine_tune_chatbot_docs_synthetic
+      title: Documentation Chatbot with Meta Synthetic Data Kit
+    - local: optuna_hpo_with_transformers
+      title: Hyperparameter Optimization with Optuna and Transformers
+    - local: function_calling_fine_tuning_llms_on_xlam
+      title: Fine-tuning LLMs for Function Calling with the xLAM Dataset
+
+
 
 - title: Computer Vision Recipes
   isExpanded: false
@@ -118,6 +130,12 @@
       title: Structured Generation from Images or Documents Using Vision Language Models
     - local: fine_tuning_granite_vision_sft_trl
       title: Fine-tuning Granite Vision with TRL
+    - local: fine_tuning_vlm_object_detection_grounding
+      title: Fine tuning a VLM for Object Detection Grounding using TRL
+    - local: fine_tuning_vlm_mpo
+      title: Fine-Tuning a Vision Language Model with TRL using MPO
+    - local: fine_tuning_vlm_grpo_trl
+      title: Post training an VLM for reasoning with GRPO using TRL
 
 - title: Search Recipes
   isExpanded: false

notebooks/en/agent_data_analyst.ipynb

Lines changed: 3 additions & 3 deletions
@@ -42,17 +42,17 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
-    "from smolagents import HfApiModel, CodeAgent\n",
+    "from smolagents import InferenceClientModel, CodeAgent\n",
     "from huggingface_hub import login\n",
     "import os\n",
     "\n",
     "login(os.getenv(\"HUGGINGFACEHUB_API_TOKEN\"))\n",
     "\n",
-    "model = HfApiModel(\"meta-llama/Llama-3.1-70B-Instruct\")\n",
+    "model = InferenceClientModel(\"meta-llama/Llama-3.1-70B-Instruct\")\n",
     "\n",
     "agent = CodeAgent(\n",
     "    tools=[],\n",

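Both hunks above are the same mechanical migration: smolagents renamed `HfApiModel` to `InferenceClientModel` (and the stale `execution_count` is reset to `null`). A self-contained sketch of the updated cell, assuming a smolagents release recent enough to ship the new name and a valid token in the environment:

```python
import os

from huggingface_hub import login
from smolagents import CodeAgent, InferenceClientModel

login(os.getenv("HUGGINGFACEHUB_API_TOKEN"))

# InferenceClientModel is the renamed HfApiModel: same role, a wrapper that
# calls the model through Hugging Face's Inference API.
model = InferenceClientModel("meta-llama/Llama-3.1-70B-Instruct")

agent = CodeAgent(
    tools=[],  # the data-analyst agent relies on generated code, not extra tools
    model=model,
)
```
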
notebooks/en/agent_rag.ipynb

Lines changed: 5 additions & 5 deletions
@@ -219,7 +219,7 @@
     "- *`tools`*: a list of tools that the agent will be able to call.\n",
     "- *`model`*: the LLM that powers the agent.\n",
     "\n",
-    "Our `model` must be a callable that takes as input a list of [messages](https://huggingface.co/docs/transformers/main/chat_templating) and returns text. It also needs to accept a `stop_sequences` argument that indicates when to stop its generation. For convenience, we directly use the `HfApiModel` class provided in the package to get a LLM engine that calls our [Inference API](https://huggingface.co/docs/api-inference/en/index).\n",
+    "Our `model` must be a callable that takes as input a list of [messages](https://huggingface.co/docs/transformers/main/chat_templating) and returns text. It also needs to accept a `stop_sequences` argument that indicates when to stop its generation. For convenience, we directly use the `InferenceClientModel` class provided in the package to get a LLM engine that calls our [Inference API](https://huggingface.co/docs/api-inference/en/index).\n",
     "\n",
     "And we use [meta-llama/Llama-3.1-70B-Instruct](https://huggingface.co/meta-llama/Llama-3.1-70B-Instruct), served for free on Hugging Face's Inference API!\n",
     "\n",
@@ -232,9 +232,9 @@
     "metadata": {},
     "outputs": [],
     "source": [
-    "from smolagents import HfApiModel, ToolCallingAgent\n",
+    "from smolagents import InferenceClientModel, ToolCallingAgent\n",
     "\n",
-    "model = HfApiModel(\"meta-llama/Llama-3.1-70B-Instruct\")\n",
+    "model = InferenceClientModel(\"meta-llama/Llama-3.1-70B-Instruct\")\n",
     "\n",
     "retriever_tool = RetrieverTool(vectordb)\n",
     "agent = ToolCallingAgent(\n",
@@ -263,15 +263,15 @@
     "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span> <span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span>\n",
     "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span> <span style=\"font-weight: bold\">How can I push a model to the Hub?</span> <span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span>\n",
     "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span> <span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span>\n",
-    "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">╰─ HfApiModel - meta-llama/Llama-3.1-70B-Instruct ────────────────────────────────────────────────────────────────╯</span>\n",
+    "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">╰─ InferenceClientModel - meta-llama/Llama-3.1-70B-Instruct ────────────────────────────────────────────────────────────────╯</span>\n",
     "</pre>\n"
     ],
     "text/plain": [
     "\u001b[38;2;212;183;2m╭─\u001b[0m\u001b[38;2;212;183;2m───────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m \u001b[0m\u001b[1;38;2;212;183;2mNew run\u001b[0m\u001b[38;2;212;183;2m \u001b[0m\u001b[38;2;212;183;2m───────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m─╮\u001b[0m\n",
     "\u001b[38;2;212;183;2m│\u001b[0m \u001b[38;2;212;183;2m│\u001b[0m\n",
     "\u001b[38;2;212;183;2m│\u001b[0m \u001b[1mHow can I push a model to the Hub?\u001b[0m \u001b[38;2;212;183;2m│\u001b[0m\n",
     "\u001b[38;2;212;183;2m│\u001b[0m \u001b[38;2;212;183;2m│\u001b[0m\n",
-    "\u001b[38;2;212;183;2m╰─\u001b[0m\u001b[38;2;212;183;2m HfApiModel - meta-llama/Llama-3.1-70B-Instruct \u001b[0m\u001b[38;2;212;183;2m───────────────────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m─╯\u001b[0m\n"
+    "\u001b[38;2;212;183;2m╰─\u001b[0m\u001b[38;2;212;183;2m InferenceClientModel - meta-llama/Llama-3.1-70B-Instruct \u001b[0m\u001b[38;2;212;183;2m───────────────────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m─╯\u001b[0m\n"
     ]
    },
    "metadata": {},

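The markdown cell in the first hunk pins down the contract the `model` argument must satisfy: a callable over a list of chat messages that also accepts `stop_sequences`. `InferenceClientModel` is the packaged convenience; a hedged sketch of roughly what it saves you from writing by hand, built on `huggingface_hub.InferenceClient` (illustrative only — the real class returns smolagents' own message objects rather than a bare string):

```python
from huggingface_hub import InferenceClient

client = InferenceClient("meta-llama/Llama-3.1-70B-Instruct")

def homemade_model(messages, stop_sequences=None):
    """Bare-bones stand-in for InferenceClientModel: messages in, text out."""
    response = client.chat_completion(
        messages=messages,
        stop=stop_sequences,  # forward the agent's stop sequences
        max_tokens=1024,
    )
    return response.choices[0].message.content
```
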
notebooks/en/agent_text_to_sql.ipynb

Lines changed: 8 additions & 8 deletions
@@ -160,7 +160,7 @@
     "\n",
     "We use the `CodeAgent`, which is `transformers.agents`' main agent class: an agent that writes actions in code and can iterate on previous output according to the ReAct framework.\n",
     "\n",
-    "The `llm_engine` is the LLM that powers the agent system. `HfApiModel` allows you to call LLMs using Hugging Face's Inference API, either via Serverless or Dedicated endpoint, but you could also use any proprietary API: check out [this other cookbook](agent_change_llm) to learn how to adapt it."
+    "The `llm_engine` is the LLM that powers the agent system. `InferenceClientModel` allows you to call LLMs using Hugging Face's Inference API, either via Serverless or Dedicated endpoint, but you could also use any proprietary API: check out [this other cookbook](agent_change_llm) to learn how to adapt it."
    ]
   },
   {
@@ -169,11 +169,11 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "from smolagents import CodeAgent, HfApiModel\n",
+    "from smolagents import CodeAgent, InferenceClientModel\n",
     "\n",
     "agent = CodeAgent(\n",
     "    tools=[sql_engine],\n",
-    "    model=HfApiModel(\"meta-llama/Meta-Llama-3-8B-Instruct\"),\n",
+    "    model=InferenceClientModel(\"meta-llama/Meta-Llama-3-8B-Instruct\"),\n",
     ")"
    ]
   },
@@ -189,15 +189,15 @@
     "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span> <span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span>\n",
     "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span> <span style=\"font-weight: bold\">Can you give me the name of the client who got the most expensive receipt?</span> <span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span>\n",
     "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span> <span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span>\n",
-    "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">╰─ HfApiModel - meta-llama/Meta-Llama-3-8B-Instruct ──────────────────────────────────────────────────────────────╯</span>\n",
+    "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">╰─ InferenceClientModel - meta-llama/Meta-Llama-3-8B-Instruct ──────────────────────────────────────────────────────────────╯</span>\n",
     "</pre>\n"
     ],
     "text/plain": [
     "\u001b[38;2;212;183;2m╭─\u001b[0m\u001b[38;2;212;183;2m───────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m \u001b[0m\u001b[1;38;2;212;183;2mNew run\u001b[0m\u001b[38;2;212;183;2m \u001b[0m\u001b[38;2;212;183;2m───────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m─╮\u001b[0m\n",
     "\u001b[38;2;212;183;2m│\u001b[0m \u001b[38;2;212;183;2m│\u001b[0m\n",
     "\u001b[38;2;212;183;2m│\u001b[0m \u001b[1mCan you give me the name of the client who got the most expensive receipt?\u001b[0m \u001b[38;2;212;183;2m│\u001b[0m\n",
     "\u001b[38;2;212;183;2m│\u001b[0m \u001b[38;2;212;183;2m│\u001b[0m\n",
-    "\u001b[38;2;212;183;2m╰─\u001b[0m\u001b[38;2;212;183;2m HfApiModel - meta-llama/Meta-Llama-3-8B-Instruct \u001b[0m\u001b[38;2;212;183;2m─────────────────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m─╯\u001b[0m\n"
+    "\u001b[38;2;212;183;2m╰─\u001b[0m\u001b[38;2;212;183;2m InferenceClientModel - meta-llama/Meta-Llama-3-8B-Instruct \u001b[0m\u001b[38;2;212;183;2m─────────────────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m─╯\u001b[0m\n"
     ]
    },
    "metadata": {},
@@ -396,15 +396,15 @@
     "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span> <span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span>\n",
     "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span> <span style=\"font-weight: bold\">Which waiter got more total money from tips?</span> <span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span>\n",
     "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span> <span style=\"color: #d4b702; text-decoration-color: #d4b702\">│</span>\n",
-    "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">╰─ HfApiModel - Qwen/Qwen2.5-72B-Instruct ────────────────────────────────────────────────────────────────────────╯</span>\n",
+    "<span style=\"color: #d4b702; text-decoration-color: #d4b702\">╰─ InferenceClientModel - Qwen/Qwen2.5-72B-Instruct ────────────────────────────────────────────────────────────────────────╯</span>\n",
     "</pre>\n"
     ],
     "text/plain": [
     "\u001b[38;2;212;183;2m╭─\u001b[0m\u001b[38;2;212;183;2m───────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m \u001b[0m\u001b[1;38;2;212;183;2mNew run\u001b[0m\u001b[38;2;212;183;2m \u001b[0m\u001b[38;2;212;183;2m───────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m─╮\u001b[0m\n",
     "\u001b[38;2;212;183;2m│\u001b[0m \u001b[38;2;212;183;2m│\u001b[0m\n",
     "\u001b[38;2;212;183;2m│\u001b[0m \u001b[1mWhich waiter got more total money from tips?\u001b[0m \u001b[38;2;212;183;2m│\u001b[0m\n",
     "\u001b[38;2;212;183;2m│\u001b[0m \u001b[38;2;212;183;2m│\u001b[0m\n",
-    "\u001b[38;2;212;183;2m╰─\u001b[0m\u001b[38;2;212;183;2m HfApiModel - Qwen/Qwen2.5-72B-Instruct \u001b[0m\u001b[38;2;212;183;2m───────────────────────────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m─╯\u001b[0m\n"
+    "\u001b[38;2;212;183;2m╰─\u001b[0m\u001b[38;2;212;183;2m InferenceClientModel - Qwen/Qwen2.5-72B-Instruct \u001b[0m\u001b[38;2;212;183;2m───────────────────────────────────────────────────────────────────────\u001b[0m\u001b[38;2;212;183;2m─╯\u001b[0m\n"
     ]
    },
    "metadata": {},
@@ -740,7 +740,7 @@
     "\n",
     "agent = CodeAgent(\n",
     "    tools=[sql_engine],\n",
-    "    model=HfApiModel(\"Qwen/Qwen2.5-72B-Instruct\"),\n",
+    "    model=InferenceClientModel(\"Qwen/Qwen2.5-72B-Instruct\"),\n",
     ")\n",
     "\n",
     "agent.run(\"Which waiter got more total money from tips?\")"

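Every hunk in this notebook is the same rename, but each agent here depends on a `sql_engine` tool defined earlier in the notebook, outside the lines shown. For orientation, a sketch of such a tool with smolagents' `@tool` decorator and SQLAlchemy (table setup omitted; the names and details are assumptions, not the notebook's exact code):

```python
from smolagents import tool
from sqlalchemy import create_engine, text

# Assumption: an in-memory SQLite database; the notebook populates its own
# receipts table before this point.
engine = create_engine("sqlite:///:memory:")

@tool
def sql_engine(query: str) -> str:
    """Performs SQL queries on the table. Returns a string of the result.

    Args:
        query: The query to perform. This should be correct SQL.
    """
    output = ""
    with engine.connect() as con:
        rows = con.execute(text(query))
        for row in rows:
            output += "\n" + str(row)
    return output
```

Wired up as in the final hunk, `CodeAgent(tools=[sql_engine], model=InferenceClientModel("Qwen/Qwen2.5-72B-Instruct"))` lets the model write a query, inspect the returned string, and iterate until `agent.run(...)` can answer.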