diff --git "a/stella_en_400m_obliqa.ipynb" "b/stella_en_400m_obliqa.ipynb" new file mode 100644--- /dev/null +++ "b/stella_en_400m_obliqa.ipynb" @@ -0,0 +1,10031 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "byfhCh_mJB_K", + "outputId": "fe485abb-ca7c-45a0-c493-e8c7cde3b9f1" + }, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Collecting git+https://github.com/huggingface/accelerate\n", + " Cloning https://github.com/huggingface/accelerate to /tmp/pip-req-build-jjzy91h2\n", + " Running command git clone --filter=blob:none --quiet https://github.com/huggingface/accelerate /tmp/pip-req-build-jjzy91h2\n", + " Resolved https://github.com/huggingface/accelerate to commit e11d3ceff3a49378796cdff5b466586d877d5c60\n", + " Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n", + " Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n", + " Preparing metadata (pyproject.toml) ... 
\u001b[?25l\u001b[?25hdone\n", + "Requirement already satisfied: numpy<3.0.0,>=1.17 in /usr/local/lib/python3.10/dist-packages (from accelerate==1.2.0.dev0) (1.26.4)\n", + "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from accelerate==1.2.0.dev0) (24.2)\n", + "Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate==1.2.0.dev0) (5.9.5)\n", + "Requirement already satisfied: pyyaml in /usr/local/lib/python3.10/dist-packages (from accelerate==1.2.0.dev0) (6.0.2)\n", + "Requirement already satisfied: torch>=1.10.0 in /usr/local/lib/python3.10/dist-packages (from accelerate==1.2.0.dev0) (2.5.1+cu121)\n", + "Requirement already satisfied: huggingface_hub>=0.21.0 in /usr/local/lib/python3.10/dist-packages (from accelerate==1.2.0.dev0) (0.26.2)\n", + "Requirement already satisfied: safetensors>=0.4.3 in /usr/local/lib/python3.10/dist-packages (from accelerate==1.2.0.dev0) (0.4.5)\n", + "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface_hub>=0.21.0->accelerate==1.2.0.dev0) (3.16.1)\n", + "Requirement already satisfied: fsspec>=2023.5.0 in /usr/local/lib/python3.10/dist-packages (from huggingface_hub>=0.21.0->accelerate==1.2.0.dev0) (2024.10.0)\n", + "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from huggingface_hub>=0.21.0->accelerate==1.2.0.dev0) (2.32.3)\n", + "Requirement already satisfied: tqdm>=4.42.1 in /usr/local/lib/python3.10/dist-packages (from huggingface_hub>=0.21.0->accelerate==1.2.0.dev0) (4.66.6)\n", + "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface_hub>=0.21.0->accelerate==1.2.0.dev0) (4.12.2)\n", + "Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate==1.2.0.dev0) (3.4.2)\n", + "Requirement already satisfied: jinja2 in 
/usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate==1.2.0.dev0) (3.1.4)\n", + "Requirement already satisfied: sympy==1.13.1 in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate==1.2.0.dev0) (1.13.1)\n", + "Requirement already satisfied: mpmath<1.4,>=1.1.0 in /usr/local/lib/python3.10/dist-packages (from sympy==1.13.1->torch>=1.10.0->accelerate==1.2.0.dev0) (1.3.0)\n", + "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch>=1.10.0->accelerate==1.2.0.dev0) (3.0.2)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface_hub>=0.21.0->accelerate==1.2.0.dev0) (3.4.0)\n", + "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface_hub>=0.21.0->accelerate==1.2.0.dev0) (3.10)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface_hub>=0.21.0->accelerate==1.2.0.dev0) (2.2.3)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface_hub>=0.21.0->accelerate==1.2.0.dev0) (2024.8.30)\n", + "Building wheels for collected packages: accelerate\n", + " Building wheel for accelerate (pyproject.toml) ... 
\u001b[?25l\u001b[?25hdone\n", + " Created wheel for accelerate: filename=accelerate-1.2.0.dev0-py3-none-any.whl size=334925 sha256=fe7e7fe23693551890b431567674db7621ed125f02fa185baf8c2737226c7307\n", + " Stored in directory: /tmp/pip-ephem-wheel-cache-ex33hk33/wheels/f6/c7/9d/1b8a5ca8353d9307733bc719107acb67acdc95063bba749f26\n", + "Successfully built accelerate\n", + "Installing collected packages: accelerate\n", + " Attempting uninstall: accelerate\n", + " Found existing installation: accelerate 1.1.1\n", + " Uninstalling accelerate-1.1.1:\n", + " Successfully uninstalled accelerate-1.1.1\n", + "Successfully installed accelerate-1.2.0.dev0\n" + ] + } + ], + "source": [ + "!pip install git+https://github.com/huggingface/accelerate\n" + ] + }, + { + "cell_type": "code", + "source": [ + "!pip install -qqqU xformers" + ], + "metadata": { + "id": "BFDAPw3lLh-J", + "colab": { + "base_uri": "https://localhost:8080/" + }, + "outputId": "8054de24-df98-45a3-fbc5-77fa71bc5ddb" + }, + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "\u001b[?25l \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/16.7 MB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K \u001b[91m╸\u001b[0m\u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.3/16.7 MB\u001b[0m \u001b[31m8.0 MB/s\u001b[0m eta \u001b[36m0:00:03\u001b[0m\r\u001b[2K \u001b[91m━━━━━━━━\u001b[0m\u001b[91m╸\u001b[0m\u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.7/16.7 MB\u001b[0m \u001b[31m53.9 MB/s\u001b[0m eta \u001b[36m0:00:01\u001b[0m\r\u001b[2K \u001b[91m━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[90m╺\u001b[0m\u001b[90m━━━━━━━━━━━━━━━\u001b[0m \u001b[32m10.0/16.7 MB\u001b[0m \u001b[31m96.4 MB/s\u001b[0m eta \u001b[36m0:00:01\u001b[0m\r\u001b[2K \u001b[91m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[91m╸\u001b[0m \u001b[32m16.7/16.7 MB\u001b[0m \u001b[31m211.7 MB/s\u001b[0m eta 
\u001b[36m0:00:01\u001b[0m\r\u001b[2K \u001b[91m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[91m╸\u001b[0m \u001b[32m16.7/16.7 MB\u001b[0m \u001b[31m211.7 MB/s\u001b[0m eta \u001b[36m0:00:01\u001b[0m\r\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m16.7/16.7 MB\u001b[0m \u001b[31m93.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25h" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "import os\n", + "# Disable WandB and other logging integrations via environment variables (no --report_to flag is set in this cell)\n", + "os.environ[\"TRANSFORMERS_NO_LOGGING\"] = \"true\"\n", + "os.environ[\"WANDB_MODE\"] = \"disabled\"" + ], + "metadata": { + "id": "mY-Nkz3qM4AB" + }, + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "ANFexbEi5IWE", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 1000, + "referenced_widgets": [ + "006a724e98cd493ca0ce77169a472148", + "4b1d4195413645f1ad1e52a435db6387", + "18120c9035104c05bb2c0f1b43939e20", + "fa38d90c7ade4800b354cc6a6f3f4766", + "5dc762206db44de49341e399ec05545c", + "4601dd2eca5b40c0ba89f364d4c397b1", + "4413a301852747b9b3e47546408d6781", + "b74d73e69fc84a1fb117e7f7c7e6e65d", + "76c94700104f44cf9dd13461b0ef870a", + "9fb03f1cde9745ab8538c73babc3be0e", + "16f1a6b4a1f94d64be6a905f3775aa22", + "9f9dd00eed0346e4b0cd58365ff7bc79", + "1db654ed3d6744feaf96cde37f6bffda", + "bfd3eb664d58447d989f0c3b41a91412", + "4b47c1cb44cb4483bddd247b9312faef", + "b6f5b8d4831e490496040fe5dc8bd68b", + "1ca2c08d187d42c39091a7fd93bf255d", + "677d572591474e77ad3e6985cbf32d2b", + "7365be1202ce4ce692dfbeb1eda99c9a", + "94e802e61d984453ab56e0482da64ed6", + "f2ea92fb105142b6ac2a345333ec6183", + "df9b1630c11b4a85a5453235f1b184ab", + "65711503ae1545e0aa5f949f4babc06f", + "c0a8632d992c40e7ac7a8aa1e0a5a62a", + "28821b38a3cd4f3a972924c3d514cff6", + "272b324b71eb4e0b9b9ba25d8f596dc7", + "27fb7abe5ea64dca922eafffd9113aad", + 
"5434c3ba27ef42ee91add1e3d6e45bc6", + "adeb95b1bf0b4170870a7af036ff907a", + "a8ca0ece0bbe4b92b2c6dd616f733d20", + "c8d7f959cef84bd98e0a3b737b34b094", + "6f53cf8614994c0ea62ff74dcc66fd5f", + "5ca129ba9ee942bfba6d285b2fe173e2", + "0b950b7e32de47eca6d271c7a2aaa391", + "6233f6e82d9b4243a3a4d7fb95f4968c", + "3e193ba2fe224336a83f751494a263fd", + "909c2e91d8a144a0a243f027d3f55671", + "fb21c64b0a1d445895293d7427d50393", + "53a6750261904e4e9abbd9d21979c4dd", + "911716902b6c48d7a2548e1ef68edfcb", + "e7468ddbf9f441b1bed23dd4a8012b4e", + "7acd505317ad42828b71c67bd93ed817", + "b41789928fd346dd9c82dfa9d4dbb267", + "424c5618af0c4175a4afa1d6b64ed5bf", + "3d5973fc5633454c808d849f3178edb9", + "da8e718a09184740b1a0beb09c144dde", + "87c9bf35261d4e8894e2fe96e6ebf4ee", + "4ee7363e97a64e399f1d994683cf29b6", + "242d07cb72b1464aa0cbb9f9b148b5b1", + "8919073a1ec443439945d2804cf53369", + "f22248e97eee47528a4d5d801667e23e", + "b50c567baf63448a84cd0358c9e238f4", + "a1a05da0ac8a47708b8c95b2829b35cc", + "58261680472946289deb2ce044974491", + "5646acb6f8d74d7992515d9d2f19cf43", + "a9e769e12bfd4fdc9eb9611acc2ebe3c", + "6b464699737540f7adc7496eef70c703", + "f789c34e97b446e8b5417006fef44411", + "bc6e0b3e007945abbff3860c7bad40e1", + "97cffdde5d7249c6a7187d9558ef72f2", + "8bbda8415ca548d087802dbebc5bf552", + "2746906236614ddb82ac512b0da12896", + "4b138e49b7584360b134ff203d57067c", + "d2720f7926b44387a5c74eee55a2539b", + "5baf445aef6f4d50b09d75310e275a84", + "2025ed16775a43b384d42dd63e95e8fc", + "f74d27c20cd64e8f87d0b7faa178266b", + "e83a560e637d4a8aadba1afcad90028c", + "efcb39b8673543e28918a39cb0c24b24", + "32ff42a18860406196667c5a8fa9f949", + "9d0b5bbd62634954a75633a104a3e0ad", + "2d80415fe5c94d049d1126ffeccda07b", + "ad44a159403b4ba38cbed005b709afaf", + "0986153d27644546a3acbf971b07342e", + "0c7490a802944da48510d556f7101ee7", + "82892caeee0e44eb87beaf29989db27e", + "64326555cf4d4143a88aa31ab28464c7", + "b1d76d71ef3d410d9374ef71471a6661", + "d31df3d2183b43b684dcfff1e40c734f", + 
"b422f5eff29b40a2aac67c88fc35b956", + "ff53694c169b436fba81152a737f013e", + "dfd646ca2fff4e069617301fef594d0d", + "ccaa51de3bf745208ab96e9ca2e96001", + "b1bc0dcf71b04f6f872b5262641d58c6", + "6b6cd26e9e724808836fee776bb27adb", + "0dc9541a58684a3db464d4f6dbbd8db5", + "7a31f3fe61b1474e90cfee50bb6910fa", + "fabd3f9fd0c747c5881fa4cf84e67086", + "bae55224df5741f78fe3e17ef0de4e53", + "dfeeb7494419448db52a5ba0a859b3a4", + "bab2c081d50e4d4ba4a3c344bcdf800a", + "3842d018714646d69ba506250d55079e", + "3cd040b549b540bc8cb53e1ff45d0738", + "afd23acf3a7c4454a84890abd524f793", + "3b3a2c7c187242f6a3878ba280a2fe9c", + "b8591ddff60e4887b324468e9585de4b", + "b05fe5a6704544c98a8854d722a28d6b", + "cef566de3d45400eb65dd4dd8f188863", + "0cb2a580705645e99861671ea46692c2", + "5385277e67b141a5b10150f753b29061", + "52a04b6b15014bdf8ed4ffd030b45c84", + "14a84f827f0f4212912809b490360672", + "bd067d1d62b04182b5e88c836e04c643", + "614908762ca3437b9fc4e3dab29bd18c", + "6e1be86cdf894b3fac0142debccfae21", + "13d6143fc03f4fe2894bb9d072a106b9", + "fbc18d90c03c416fa6cf293110f6fb7e", + "b29f4211cfd64a4b8b4a9550b2748d64", + "4e81d0102bc3405ea764773e78b91052", + "6b27f3b622fd4e53ac1dccf852f567fc", + "263b77cacf474563bd6ed34c29e185fc", + "4b2c412357a34f0a8f57539bacc12e96", + "e96f2cd27f444897b438c2034f8312b0", + "2537156982a146aebf2a211a97a5b768", + "1912b92b34dd429bb1cb81b0f4258119", + "3ce9483411b44eeb868c274cc46c26ef", + "f9d58ba1203643ff9f6fd8876204aaa8", + "f3376e535ff04b8d8d01e6111eb37062", + "7e6c7d355f794ba1b8f1a24ba6c9fdfe", + "22fa2d4180ec493394941c65f8705cac", + "4aa923a5a5534f84a97702974f6ba381", + "7dc90b65c80f4f55b38aa74e63ffc15c", + "f3e30b2d6d484024bb23e4b28d1962a1", + "9c46508954cf49f4bb250ff18b1091a9", + "21997555b8ec4bc9a447e51d941a86ba", + "22122f5e155648f7ab78951be80baa96", + "a98f5ef5b76c454d9296a319c3447196", + "43142b306f7d46aeb98b46d50043fd19", + "8e6dfe21b5b343fe89653e2c7c3e0181", + "ad45d119ba9a46d28d3db8fdedde4b2a", + "6dcaf46a4f834a64b44928dae134c001", + 
"9309cc1679614ed6a4a93f8ff7e52946", + "b73a7249830e4ad884f0f12d26d31403", + "68d1ce3423fa4f34a6b22114076030bc", + "af158dd45f8346f78781bd32e2e7ad47", + "d9223d36b6a04ef6a45dfd6e9fe93456", + "9e0e860551b645649292506707e80142", + "f423739bf718408180e17ee38ef7569a", + "2f6662dc03154910ac74afcd4b36bf4a", + "2c23aea2b5e246278c92196d1789d313", + "eb26bb9e6dc942e9b7d8b24284f6fbf8", + "5695801789724803aa5da60dbb5417b4", + "14a140271c6b41668e1c438b2bcc647d", + "6e30d7b2389844eb8321d96167257dbf", + "4efed20048304ad98fe5c709df023f2f", + "bdea5a96c4724b14b9f77c601d944236", + "3da5147f41184447910c65f2b695235d", + "57e86acd50af4328b8833f3e28fd5687", + "d5debab101ef438baeb8a195d6b48dff", + "5f3ef839374c4c07858cc42663b48639", + "f0942e9d1ac043269801421aa9565783", + "0ca959210ad94bb8ac1cc9a6aa9ddad3", + "4fc1355864554427a6b7d04011ea9b3c", + "2aa0e706b1b340089beab02320eb511f", + "9017fee2964b42f098e63cab44cc1aab", + "a09acfe96ed84bb48cba7df646fec53b", + "ed463399910d41fcacdfd83c04e9f722", + "3a4051f9b0bf49109ab702bd3036c8f5", + "2cc940e37ffe43358afbbac85f79ae5b", + "5d6da236cc3c488da47abfb4d6423977", + "5adf6cf54b3049c297dae3fdba4e6c84", + "6b3af3d3bb4645b5a9edf76e3a06909d", + "2aa2e61d4ad04ba9b7af7d3ee90b8ee1", + "ef0870f7473c4589922e9bc47328be54", + "1ec19ad6c4c341ce96ab8a557a0b2626", + "3cefe2856faf47dab827b543c672d5ff", + "0ef3b72e704d40a4af7406f64d4d993f", + "47b462a7d07b4b67888c6436eda9c785", + "d0fd2935e9024213bbda1d9464b883e1", + "3180aaf299c943b785966d8e0dfb5680", + "4e1b8e353f8447a7a3c915a2b2c3c124", + "c0eecb82fa324026a19a88de1e5bc8b5", + "2ea594a8c2384ef68b65f3d6aca6b673", + "95aa1616a2064ee588eafa6c6b50282a", + "e32b3f04e6aa42bab7046bc10e26fe57", + "6bc3697159e24899b0561ad56e57a889", + "48ece00d31d040e1a3b35959118bd130", + "36ed4f39fc114d10b5b9d0b91e0c1ed3", + "5a6e7bee9bf448fdac30886bcee687b3", + "94741549c2604d4dacfad53d826e5b7e", + "b5e4965e0d8f4b3bb105771f210a155e", + "607727ab674145c48c1d518dbaff1674", + "5eb53ded83b04d0193722676d28589bd", + 
"4dbafdefc4bc43deb85eaf12a94c2039", + "18d3e89fb45c4c74ac1070ab0e7c10d2", + "73bc7878891d42818baca220aa136c98", + "8e31ab49cff642a098b063b6c3a8444c", + "293e7c1d2c0141e68d7852b093ac5a88", + "4f05ef3ce4c542e68d8c468022217d40", + "de27bc11dba3479d8f7d56598536a267", + "edc516b7e6b242139708e679661d14f8", + "818b20c8dabd4313ba289f18696832bc", + "d356fc3d80164d529f67355392c279cb", + "b24aefe723154bbca31f5632e0c788ea", + "a3cc0b15be564ec58f1a0a5d5cc22942", + "6eaf795c57cc416c9dca8fd138e91121", + "1a25daea19734fdaaeb5a389de458dfd", + "8a035a15ba6d40e9a038072938913dfd", + "19e68e56612643f0b381e8daf0cd21a0", + "8cd052c7879d426aa65d74e93f608d48", + "c37809ef6b124e90b317d3b440dfaf70", + "805932de89254c89a73ef7aa86380f8c", + "a53918b0174a439f881f081e5e586266", + "fe8c1f75f12f4ffe802b6f13c7a01b91", + "ffda8ab5bce84781a42381fc766a7abb", + "91cdfa9cf20e4e0e96529447761b3182", + "1aa1c0059af24c09b61c09ef36bcd0c8", + "b04b26f176344f9e91abf56c5b949ca8", + "03a59e5ba10e44a485c616428a1a47aa", + "932d81095dc74f3e8c42267a861bfce7", + "45874975a252497d9f6e6fd1f1642b20", + "1d7ab85b01a749f0bac0ba41384c578c", + "8860c9fc21894acdb1c6928aab713c3f", + "49ab6de9bb8946268b282ddf3d626fdb", + "fed683dff76e401b996381ae3f84ad17", + "8a6286ed16554d059b7c5b51359450ff", + "07ee58d8089b4459a5af2c0b6ca5071f", + "296abd5c9fa5460382cd447910707906", + "36b0cfb24b1b4d3c8bc627d3cdd74814", + "38894974b88348e5b9a90b1d1252aa7a", + "2b667b464df6451aba052e7f2930c524", + "ac8308e02ad3422186dc3172ed752bc8", + "c82f246720d34124941259811462be4e", + "3f5e0c22bac441229a34196a944f37f0", + "4189614b67bc4cd992ca9392c6971123", + "1914321179104f709a051d0c77e950e5", + "0531f9d56b8b4676bae4f80e1aa7c1ad", + "b192fc1a01a3448cb211ba9d990a5040", + "5a6443257866492f8c03f49cb846b5e1", + "da5995b0a11a4f9a9cc08c1b5ff25f1a", + "1a82883d8cc34994a1155e289486e21c", + "3cdeecb3fb0347a5ad749da82603746f", + "24217c590100420883e5feae0fbd4aa5", + "9219a3461bfe40069a1d5e3f2da924fd", + "f2979ef7dfc748528ef1c3228b27527a", + 
"c1ade31b386f4b44bc9c739bdac8ec33", + "1d2938baf40a419394be616d02d2f809", + "23b09808f3264946800993d495f24d9d", + "96b4157c14084fe0a0de653825296619", + "2c6db4458eaa4efaa2c3b7e725567063", + "2c83eadbfe5c4471a2657ff753b58cca", + "3feeeeb0c23a4cae88a3abbe8dccadc0", + "1f82319d44eb4a34a919a54a38bf6549", + "2cc736f5092a4a4cae02ff80f38ba7d8", + "5b3e12d0f72340eaaae0f581095e5aee", + "3bf513048714492b9cbd2bbb2d1d80e1", + "53f8f53c5e6e471991e7f6bb967079d5", + "b19bc3da3b2b422ca921d70c04a45cf3", + "44704a4b66374e0c82f56b67dbabeddf", + "51f9deefd5734d9f8dfa4eb63739bf25", + "2325b4ac53984e10b50dfe80f4e81687", + "15308b31af1a4fa5a452fd25b5eb55ef", + "6211e7711ed04fa982fdfefb03157127", + "ace7a954f0544ca1b9cd19f56603f5a5", + "4f1ea86073024eb69b3dc92bf23f66e8", + "eb0f4a9bb3c049d49cd685511b21f6b4", + "e4aac20ff5344bb088d97a121dffff6f", + "c2762366ea42413a908224e299b23a1f", + "d6ae29c10d6343508490895f88a7dd47", + "62e74d80ed3c48d486cbf66786a7eb47", + "be1dedfda5b34548afab9d6074c99387", + "36c8dcdbbbdc4107807f6e7e3f4832cc", + "fd919145bdd644488219d90b900dac33", + "84cc8504d85646f89685579447dc8517", + "03934ff1821c4bedbf8eaa87c26e1f70", + "41435cf03ad243d0af79fef038180f94", + "6b371cef09464d6390ab78ea50bdc3f2", + "51382268cf02438bb42209da574d084d", + "b3b10aee53e44b06b47ab7255146c53c", + "e5ce2add756a40f4af6e5799289ee98d", + "3c3c6b8b1e9f4063b6eab9d583bce185", + "a20a5b6596f34a4e9f4fd602181574a9", + "92a78f794b424ff389776aff4480add0", + "2a6e939af9034165a621f7e4f2ff5880", + "05c78b5c035e4004ad10230cc7c1eb86", + "9b370c30602e4179ba03c1e26cb54090", + "50259c434ff44210a3c6a395e625ddf5", + "2738d5b1237b420d97b1fcb4366525aa", + "09ba93bfa8d54e8abf64b8febe3bbc55", + "0e30f67bf9d542c6a88ebe4f6ee76146", + "18ed40602f63483fa3648a7d8bb52076", + "4dbc9623e18f4fe9879a04daae747e7b", + "7061e705c05e4037a1bc8e513730c976", + "0ac97bfa827441d699f2c64c0b55e953", + "1ddd52e65a024fda8323bdb15ee2d563", + "c4e21b6e7d1a4daea5dca188ede30882" + ] + }, + "outputId": "222c8a16-9936-43af-c659-bb2c6f6daabd" + 
}, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "\u001b[?25l \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/480.6 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K \u001b[91m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[90m╺\u001b[0m \u001b[32m471.0/480.6 kB\u001b[0m \u001b[31m22.5 MB/s\u001b[0m eta \u001b[36m0:00:01\u001b[0m\r\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m480.6/480.6 kB\u001b[0m \u001b[31m13.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25h\u001b[?25l \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/116.3 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m116.3/116.3 kB\u001b[0m \u001b[31m10.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25h\u001b[?25l \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/179.3 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m179.3/179.3 kB\u001b[0m \u001b[31m13.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25h\u001b[?25l \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/134.8 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.8/134.8 kB\u001b[0m \u001b[31m11.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25h\u001b[?25l \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/194.1 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m194.1/194.1 kB\u001b[0m \u001b[31m16.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25h\u001b[31mERROR: pip's dependency 
resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n", + "gcsfs 2024.10.0 requires fsspec==2024.10.0, but you have fsspec 2024.9.0 which is incompatible.\u001b[0m\u001b[31m\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m44.4/44.4 kB\u001b[0m \u001b[31m2.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m9.9/9.9 MB\u001b[0m \u001b[31m91.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m245.3/245.3 kB\u001b[0m \u001b[31m20.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25h" + ] + }, + { + "output_type": "stream", + "name": "stderr", + "text": [ + "/usr/local/lib/python3.10/dist-packages/sentence_transformers/cross_encoder/CrossEncoder.py:13: TqdmExperimentalWarning: Using `tqdm.autonotebook.tqdm` in notebook mode. Use `tqdm.tqdm` instead to force console mode (e.g. in jupyter console)\n", + " from tqdm.autonotebook import tqdm, trange\n", + "/usr/local/lib/python3.10/dist-packages/huggingface_hub/utils/_auth.py:94: UserWarning: \n", + "The secret `HF_TOKEN` does not exist in your Colab secrets.\n", + "To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n", + "You will be able to reuse this secret in all of your notebooks.\n", + "Please note that authentication is recommended but still optional to access public models or datasets.\n", + " warnings.warn(\n" + ] + }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + "modules.json: 0%| | 0.00/316 [00:00" + ], + "text/html": [ + "\n", + "
\n", + " \n", + " \n", + " [ 601/11150 16:07 < 4:44:01, 0.62 it/s, Epoch 0.27/5]\n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
StepTraining LossValidation LossCosine Accuracy@1Cosine Accuracy@3Cosine Accuracy@5Cosine Accuracy@10Cosine Precision@1Cosine Precision@3Cosine Precision@5Cosine Precision@10Cosine Recall@1Cosine Recall@3Cosine Recall@5Cosine Recall@10Cosine Ndcg@10Cosine Mrr@10Cosine Map@100Dot Accuracy@1Dot Accuracy@3Dot Accuracy@5Dot Accuracy@10Dot Precision@1Dot Precision@3Dot Precision@5Dot Precision@10Dot Recall@1Dot Recall@3Dot Recall@5Dot Recall@10Dot Ndcg@10Dot Mrr@10Dot Map@100
200No logNo log0.6398850.7557390.7819230.8066710.6398850.2651840.1675750.0887730.5628650.6746170.7032880.7329270.6744710.7006780.6394160.5961260.7252510.7600430.7962700.5961260.2533480.1624820.0873390.5282220.6494620.6840150.7223880.6495680.6669840.611385
400No logNo log0.6531560.7578910.7855090.8091820.6531560.2654230.1684360.0893830.5732840.6755080.7051710.7358080.6810550.7095500.6472460.6176470.7367290.7718790.8048780.6176470.2584890.1654950.0885220.5439740.6582680.6931250.7305770.6619090.6833940.624376

" + ] + }, + "metadata": {} + }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + "Batches: 0%| | 0/88 [00:00