huggingface
diff --git a/‎.github/pull_request_template.md
Lines changed: 1 addition & 1 deletion b/‎.github/pull_request_template.md
Lines changed: 1 addition & 1 deletion
diff --git a/‎course/en/chapter1/section3.ipynb
Lines changed: 322 additions & 0 deletions b/‎course/en/chapter1/section3.ipynb
Lines changed: 322 additions & 0 deletions
diff --git a/‎course/en/chapter1/section8.ipynb
Lines changed: 63 additions & 0 deletions b/‎course/en/chapter1/section8.ipynb
Lines changed: 63 additions & 0 deletions
@@ -7,7 +7,7 @@ Someone will review your PR shortly (see the section "Who can review?" below to
 
 Note: the notebooks in the `course` and `transformers_doc` directories are auto-generated, so are best fixed at their source. Instead, follow the instructions below for these notebooks:
 
-- `course`: Create a post on our forums and tag @lewtun (https://discuss.huggingface.co/c/course/20)
+- `course`: Open a PR directly on the `course` repo (https://github.com/huggingface/course)
 - `transformers_doc`: Open a PR directly on the `transformers` repo (https://github.com/huggingface/transformers)
 
 -->
 
@@ -0,0 +1,322 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Transformers, what can they do?"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Install the Transformers, Datasets, and Evaluate libraries to run this notebook."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "!pip install datasets evaluate transformers[sentencepiece]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[{'label': 'POSITIVE', 'score': 0.9598047137260437}]"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "classifier = pipeline(\"sentiment-analysis\")\n",
+    "classifier(\"I've been waiting for a HuggingFace course my whole life.\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[{'label': 'POSITIVE', 'score': 0.9598047137260437},\n",
+       " {'label': 'NEGATIVE', 'score': 0.9994558095932007}]"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "classifier(\n",
+    "    [\"I've been waiting for a HuggingFace course my whole life.\", \"I hate this so much!\"]\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "{'sequence': 'This is a course about the Transformers library',\n",
+       " 'labels': ['education', 'business', 'politics'],\n",
+       " 'scores': [0.8445963859558105, 0.111976258456707, 0.043427448719739914]}"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "classifier = pipeline(\"zero-shot-classification\")\n",
+    "classifier(\n",
+    "    \"This is a course about the Transformers library\",\n",
+    "    candidate_labels=[\"education\", \"politics\", \"business\"],\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[{'generated_text': 'In this course, we will teach you how to understand and use '\n",
+       "                    'data flow and data interchange when handling user data. We '\n",
+       "                    'will be working with one or more of the most commonly used '\n",
+       "                    'data flows — data flows of various types, as seen by the '\n",
+       "                    'HTTP'}]"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "generator = pipeline(\"text-generation\")\n",
+    "generator(\"In this course, we will teach you how to\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[{'generated_text': 'In this course, we will teach you how to manipulate the world and '\n",
+       "                    'move your mental and physical capabilities to your advantage.'},\n",
+       " {'generated_text': 'In this course, we will teach you how to become an expert and '\n",
+       "                    'practice realtime, and with a hands on experience on both real '\n",
+       "                    'time and real'}]"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "generator = pipeline(\"text-generation\", model=\"distilgpt2\")\n",
+    "generator(\n",
+    "    \"In this course, we will teach you how to\",\n",
+    "    max_length=30,\n",
+    "    num_return_sequences=2,\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[{'sequence': 'This course will teach you all about mathematical models.',\n",
+       "  'score': 0.19619831442832947,\n",
+       "  'token': 30412,\n",
+       "  'token_str': ' mathematical'},\n",
+       " {'sequence': 'This course will teach you all about computational models.',\n",
+       "  'score': 0.04052725434303284,\n",
+       "  'token': 38163,\n",
+       "  'token_str': ' computational'}]"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "unmasker = pipeline(\"fill-mask\")\n",
+    "unmasker(\"This course will teach you all about <mask> models.\", top_k=2)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[{'entity_group': 'PER', 'score': 0.99816, 'word': 'Sylvain', 'start': 11, 'end': 18}, \n",
+       " {'entity_group': 'ORG', 'score': 0.97960, 'word': 'Hugging Face', 'start': 33, 'end': 45}, \n",
+       " {'entity_group': 'LOC', 'score': 0.99321, 'word': 'Brooklyn', 'start': 49, 'end': 57}\n",
+       "]"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "ner = pipeline(\"ner\", grouped_entities=True)\n",
+    "ner(\"My name is Sylvain and I work at Hugging Face in Brooklyn.\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "{'score': 0.6385916471481323, 'start': 33, 'end': 45, 'answer': 'Hugging Face'}"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "question_answerer = pipeline(\"question-answering\")\n",
+    "question_answerer(\n",
+    "    question=\"Where do I work?\",\n",
+    "    context=\"My name is Sylvain and I work at Hugging Face in Brooklyn\",\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[{'summary_text': ' America has changed dramatically during recent years . The '\n",
+       "                  'number of engineering graduates in the U.S. has declined in '\n",
+       "                  'traditional engineering disciplines such as mechanical, civil '\n",
+       "                  ', electrical, chemical, and aeronautical engineering . Rapidly '\n",
+       "                  'developing economies such as China and India, as well as other '\n",
+       "                  'industrial countries in Europe and Asia, continue to encourage '\n",
+       "                  'and advance engineering .'}]"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "summarizer = pipeline(\"summarization\")\n",
+    "summarizer(\n",
+    "    \"\"\"\n",
+    "    America has changed dramatically during recent years. Not only has the number of \n",
+    "    graduates in traditional engineering disciplines such as mechanical, civil, \n",
+    "    electrical, chemical, and aeronautical engineering declined, but in most of \n",
+    "    the premier American universities engineering curricula now concentrate on \n",
+    "    and encourage largely the study of engineering science. As a result, there \n",
+    "    are declining offerings in engineering subjects dealing with infrastructure, \n",
+    "    the environment, and related issues, and greater concentration on high \n",
+    "    technology subjects, largely supporting increasingly complex scientific \n",
+    "    developments. While the latter is important, it should not be at the expense \n",
+    "    of more traditional engineering.\n",
+    "\n",
+    "    Rapidly developing economies such as China and India, as well as other \n",
+    "    industrial countries in Europe and Asia, continue to encourage and advance \n",
+    "    the teaching of engineering. Both China and India, respectively, graduate \n",
+    "    six and eight times as many traditional engineers as does the United States. \n",
+    "    Other industrial countries at minimum maintain their output, while America \n",
+    "    suffers an increasingly serious decline in the number of engineering graduates \n",
+    "    and a lack of well-educated engineers.\n",
+    "\"\"\"\n",
+    ")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "[{'translation_text': 'This course is produced by Hugging Face.'}]"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "translator = pipeline(\"translation\", model=\"Helsinki-NLP/opus-mt-fr-en\")\n",
+    "translator(\"Ce cours est produit par Hugging Face.\")"
+   ]
+  }
+ ],
+ "metadata": {
+  "colab": {
+   "name": "Transformers, what can they do?",
+   "provenance": []
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}
@@ -0,0 +1,63 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Bias and limitations"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Install the Transformers, Datasets, and Evaluate libraries to run this notebook."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "!pip install datasets evaluate transformers[sentencepiece]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "['lawyer', 'carpenter', 'doctor', 'waiter', 'mechanic']\n",
+       "['nurse', 'waitress', 'teacher', 'maid', 'prostitute']"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "unmasker = pipeline(\"fill-mask\", model=\"bert-base-uncased\")\n",
+    "result = unmasker(\"This man works as a [MASK].\")\n",
+    "print([r[\"token_str\"] for r in result])\n",
+    "\n",
+    "result = unmasker(\"This woman works as a [MASK].\")\n",
+    "print([r[\"token_str\"] for r in result])"
+   ]
+  }
+ ],
+ "metadata": {
+  "colab": {
+   "name": "Bias and limitations",
+   "provenance": []
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}