diff --git "a/run_evaluations_on_common_voice_test_7_0.ipynb" "b/run_evaluations_on_common_voice_test_7_0.ipynb"
new file mode 100644--- /dev/null
+++ "b/run_evaluations_on_common_voice_test_7_0.ipynb"
@@ -0,0 +1,3217 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "id": "c8c824ea",
+ "metadata": {},
+ "source": [
+ "
This notebook is for testing models against common_voice (v7).
"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "a9180c0b",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "source": [
+ "\n",
+ "\n",
+ "\n",
+ "##### TEST WITH RASMUS 1B model with language model added using our own common_voice v7 (processed before event) ###"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "0ea4e3d0",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "outputs": [],
+ "source": [
+ "# Environment settings: \n",
+ "import pandas as pd\n",
+ "pd.set_option('display.max_column', None)\n",
+ "pd.set_option('display.max_rows', None)\n",
+ "pd.set_option('display.max_seq_items', None)\n",
+ "pd.set_option('display.max_colwidth', 500)\n",
+ "pd.set_option('expand_frame_repr', True)\n",
+ "\n",
+ "from datasets import concatenate_datasets, load_dataset"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "0a810556",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "outputs": [
+ {
+ "data": {
+ "application/vnd.jupyter.widget-view+json": {
+ "model_id": "c56f4efc99cc4320a0ddee55f8c6dfce",
+ "version_major": 2,
+ "version_minor": 0
+ },
+ "text/plain": [
+ "VBox(children=(HTML(value='\\n\", \"…\", \"–\", \"°\", \"´\", \"ʾ\", \"‹\", \"›\", \"©\", \"®\", \"—\", \"→\", \"。\",\n",
+ " \"、\", \"﹂\", \"﹁\", \"‧\", \"~\", \"﹏\", \",\", \"{\", \"}\", \"(\", \")\", \"[\", \"]\", \"【\", \"】\", \"‥\", \"〽\",\n",
+ " \"『\", \"』\", \"〝\", \"〟\", \"⟨\", \"⟩\", \"〜\", \":\", \"!\", \"?\", \"♪\", \"؛\", \"/\", \"\\\\\", \"º\", \"−\", \"^\", \"ʻ\", \"ˆ\"]\n",
+ "\n",
+ "\n",
+ "chars_to_remove_regex = f\"[{re.escape(''.join(CHARS_TO_IGNORE))}]\"\n",
+ "\n",
+ "def remove_special_characters(batch):\n",
+ "    \"\"\"Normalize the transcript of one example.\n",
+ "\n",
+ "    Every character matched by `chars_to_remove_regex` is deleted from the\n",
+ "    `sentence` entry and the remaining text is lowercased. The example is\n",
+ "    updated in place and returned.\n",
+ "    \"\"\"\n",
+ "    stripped = re.sub(chars_to_remove_regex, '', batch[\"sentence\"])\n",
+ "    batch[\"sentence\"] = stripped.lower()\n",
+ "    return batch\n",
+ "\n",
+ "common_voice_test = common_voice_test.map(remove_special_characters)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "id": "42423e76",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "Dataset({\n",
+ " features: ['client_id', 'path', 'sentence', 'up_votes', 'down_votes', 'age', 'gender', 'accent', 'locale', 'segment', 'split', 'audio', 'dataset_name', 'filename', '__index_level_0__'],\n",
+ " num_rows: 1599\n",
+ "})"
+ ]
+ },
+ "execution_count": 12,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "common_voice_test"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 13,
+ "id": "21d0937f",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "outputs": [],
+ "source": [
+ "common_voice_test_audio = common_voice_test.cast_column(\"audio\", Audio(sampling_rate=16_000))\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 14,
+ "id": "02f295cf",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def prepare_dataset(batch):\n",
+ "    \"\"\"Add model inputs and label ids to one dataset example.\n",
+ "\n",
+ "    Relies on the notebook-level `processor` object.\n",
+ "\n",
+ "    Args:\n",
+ "        batch: example holding an `audio` entry (with `array` and\n",
+ "            `sampling_rate`) and a `sentence` entry.\n",
+ "\n",
+ "    Returns:\n",
+ "        The same example with `input_values`, `input_length` and `labels` added.\n",
+ "    \"\"\"\n",
+ "    audio = batch[\"audio\"]\n",
+ "\n",
+ "    # The processor output is batched; keep only its first (and only) row.\n",
+ "    batch[\"input_values\"] = processor(audio[\"array\"], sampling_rate=audio[\"sampling_rate\"]).input_values[0]\n",
+ "    batch[\"input_length\"] = len(batch[\"input_values\"])\n",
+ "\n",
+ "    # NOTE(review): as_target_processor() presumably switches processor(...) to\n",
+ "    # encoding the transcript text -- confirm against the transformers docs.\n",
+ "    with processor.as_target_processor():\n",
+ "        batch[\"labels\"] = processor(batch[\"sentence\"]).input_ids\n",
+ "    return batch"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 15,
+ "id": "1341388b",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "application/vnd.jupyter.widget-view+json": {
+ "model_id": "8798d1f90aa241129972f072d31f7686",
+ "version_major": 2,
+ "version_minor": 0
+ },
+ "text/plain": [
+ " 0%| | 0/1599 [00:00, ?ex/s]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "common_voice_test_audio = common_voice_test_audio.map(prepare_dataset)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 16,
+ "id": "fe10fb6d",
+ "metadata": {
+ "collapsed": true,
+ "jupyter": {
+ "outputs_hidden": true
+ }
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'client_id': '635303a7d1e2ea13318960e7d71fd39251278ed8c30a11f4dc2db03ea528e70f67f5474f820bf938baaa12e5b6d6c76520e84ab3714bef5d86c86010f43de21e',\n",
+ " 'path': '/workspace/xlsr_fi/common_voice_fi/clips/common_voice_fi_25838955.mp3',\n",
+ " 'sentence': 'nyt en missään tapauksessa sinua auta',\n",
+ " 'up_votes': '2',\n",
+ " 'down_votes': '0',\n",
+ " 'age': None,\n",
+ " 'gender': None,\n",
+ " 'accent': None,\n",
+ " 'locale': 'fi',\n",
+ " 'segment': None,\n",
+ " 'split': 'test',\n",
+ " 'audio': {'array': [0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " 0.0,\n",
+ " -3.561941713803307e-11,\n",
+ " 3.2315783382586005e-10,\n",
+ " -1.0361054236796008e-09,\n",
+ " 2.637220442025523e-09,\n",
+ " -6.012712994163394e-09,\n",
+ " 1.987172559836381e-08,\n",
+ " 1.6121767032473144e-08,\n",
+ " 3.6444284035042074e-08,\n",
+ " 7.206870833442736e-08,\n",
+ " 3.6768959432720294e-08,\n",
+ " 4.486023996719268e-08,\n",
+ " 5.2210459955404076e-08,\n",
+ " -1.1670257649143423e-08,\n",
+ " 2.1646766157346065e-08,\n",
+ " 4.6971187828148686e-08,\n",
+ " -4.548990073516279e-09,\n",
+ " 3.1375012810030967e-08,\n",
+ " -7.115136951840739e-11,\n",
+ " -8.240492732625171e-10,\n",
+ " 2.139185717453529e-09,\n",
+ " -1.0977332820516494e-08,\n",
+ " -1.0940453876173706e-07,\n",
+ " -1.1150990530950367e-07,\n",
+ " 2.9246734811749775e-08,\n",
+ " 7.628233333889511e-08,\n",
+ " -1.643446090326961e-08,\n",
+ " -1.316722944011417e-07,\n",
+ " -1.3977759749650431e-07,\n",
+ " -1.011353774060808e-07,\n",
+ " -4.874259573739437e-08,\n",
+ " 8.274796670093565e-08,\n",
+ " -1.650664316343864e-08,\n",
+ " 4.130545505631744e-08,\n",
+ " 1.5895285798706027e-07,\n",
+ " 1.201868684574947e-07,\n",
+ " 6.451324452427798e-08,\n",
+ " -3.4431671402934683e-10,\n",
+ " 2.6335763436691195e-07,\n",
+ " 3.18770275953284e-07,\n",
+ " 2.2719626713296748e-07,\n",
+ " 5.761494890066388e-07,\n",
+ " 3.9057195522218535e-07,\n",
+ " 2.000890049203008e-07,\n",
+ " 3.24664028994448e-07,\n",
+ " 3.768744250010059e-08,\n",
+ " 1.0992496157768983e-07,\n",
+ " 1.2698909301889216e-07,\n",
+ " -6.927825069169558e-08,\n",
+ " 1.292661266916184e-07,\n",
+ " -4.822758725708809e-08,\n",
+ " -1.3583041891251924e-07,\n",
+ " 2.7037145855501876e-07,\n",
+ " 2.3176689012416318e-07,\n",
+ " -4.818684828933328e-07,\n",
+ " -6.672987638012273e-07,\n",
+ " 1.5273433007223502e-07,\n",
+ " 5.910178515478037e-07,\n",
+ " 9.27804890693551e-08,\n",
+ " -7.832215942471521e-07,\n",
+ " -8.352251938958943e-07,\n",
+ " -7.450622661053785e-07,\n",
+ " -2.90129264612915e-07,\n",
+ " 2.527276876662654e-07,\n",
+ " -1.0289207352798257e-07,\n",
+ " 1.9815753660168411e-07,\n",
+ " 5.346583407117578e-07,\n",
+ " 7.346763482019014e-07,\n",
+ " 2.785272670280392e-07,\n",
+ " 1.334430805854936e-07,\n",
+ " 1.7146596746897558e-06,\n",
+ " 1.2457913953767275e-06,\n",
+ " 2.1926587123743957e-06,\n",
+ " 3.8018922623450635e-06,\n",
+ " 1.694697516541055e-06,\n",
+ " 2.4414789550064597e-06,\n",
+ " 2.2111596535978606e-06,\n",
+ " 1.907394135969298e-07,\n",
+ " 2.1791572635265766e-07,\n",
+ " 8.770623480813811e-07,\n",
+ " 2.9780962904624175e-06,\n",
+ " 2.4453308355987247e-07,\n",
+ " 2.1885378487240814e-07,\n",
+ " 3.6823926166107412e-06,\n",
+ " -2.1835037387063494e-06,\n",
+ " -5.079288257547887e-06,\n",
+ " -3.0982821499492275e-06,\n",
+ " -1.423842604708625e-06,\n",
+ " 1.3861464367437293e-06,\n",
+ " 2.329990365979029e-06,\n",
+ " 1.9110418634227244e-06,\n",
+ " -1.6359018673028913e-06,\n",
+ " -1.998977495532017e-06,\n",
+ " 4.6633394390482863e-07,\n",
+ " 1.3132456615494448e-06,\n",
+ " 1.758200369295082e-06,\n",
+ " 8.826746977774746e-08,\n",
+ " -6.492704187621712e-07,\n",
+ " -2.4907787974370876e-06,\n",
+ " -3.877485596603947e-06,\n",
+ " -2.741990329013788e-06,\n",
+ " 3.3128844734164886e-07,\n",
+ " 2.9659179290320026e-06,\n",
+ " 2.655029675224796e-06,\n",
+ " 6.462948931584833e-06,\n",
+ " 7.908212865004316e-06,\n",
+ " 5.196172423893586e-06,\n",
+ " 4.703387730842223e-06,\n",
+ " 4.296306087780977e-06,\n",
+ " -1.3541003340833413e-07,\n",
+ " -7.3281003096781205e-06,\n",
+ " -5.673833584296517e-06,\n",
+ " -4.883292604063172e-06,\n",
+ " -6.67936774334521e-06,\n",
+ " -9.022893436849699e-07,\n",
+ " 1.6163796772161731e-06,\n",
+ " -4.353416898084106e-07,\n",
+ " 1.8858756902773166e-06,\n",
+ " 7.4389354267623276e-06,\n",
+ " 5.0787298278009985e-06,\n",
+ " 3.3889311907842057e-06,\n",
+ " 5.551770755118923e-06,\n",
+ " 2.1050198029115563e-06,\n",
+ " 4.618770162778674e-06,\n",
+ " 7.528428795922082e-06,\n",
+ " 4.016617822344415e-06,\n",
+ " 1.5532102679571835e-06,\n",
+ " 2.7625362690741895e-06,\n",
+ " 1.0951551665527859e-08,\n",
+ " -4.321609594626352e-06,\n",
+ " 1.2789544143743115e-06,\n",
+ " -6.351413617267099e-08,\n",
+ " 1.7302703270161146e-07,\n",
+ " 2.91728247248102e-06,\n",
+ " -6.733676400472177e-06,\n",
+ " -2.0953893908881582e-06,\n",
+ " 1.7686879800749011e-06,\n",
+ " -3.734821120815468e-06,\n",
+ " -2.1146061044419184e-06,\n",
+ " -9.299872544943355e-06,\n",
+ " -8.123151928884909e-06,\n",
+ " -1.0103318572873832e-06,\n",
+ " -7.416238986479584e-06,\n",
+ " -8.625443115306552e-06,\n",
+ " -4.2274914449080825e-06,\n",
+ " 4.862968580710003e-06,\n",
+ " 2.2065812572691357e-06,\n",
+ " -9.575691365171224e-06,\n",
+ " -1.0196828270636615e-07,\n",
+ " 7.584816330563626e-07,\n",
+ " -2.779610440484248e-06,\n",
+ " 4.86702492707991e-06,\n",
+ " 3.4975362268596655e-06,\n",
+ " 5.2502696235023905e-06,\n",
+ " 8.078756764007267e-06,\n",
+ " 1.2787868399755098e-05,\n",
+ " 9.590833542461041e-06,\n",
+ " 4.597787665261421e-06,\n",
+ " 5.280201548885088e-06,\n",
+ " -1.0549186299613211e-05,\n",
+ " 1.0517466080273152e-06,\n",
+ " 9.001542821351904e-06,\n",
+ " -9.43053328228416e-06,\n",
+ " 2.3615564259671373e-06,\n",
+ " 9.25023073250486e-07,\n",
+ " -4.522394647210604e-06,\n",
+ " 6.797630248911446e-06,\n",
+ " -1.8374051933278679e-06,\n",
+ " -9.992287232307717e-06,\n",
+ " -1.1969301567660295e-06,\n",
+ " 7.970785190991592e-06,\n",
+ " 6.0516017583722714e-06,\n",
+ " 5.552871698455419e-06,\n",
+ " 1.3878839411063382e-07,\n",
+ " 2.738499460974708e-06,\n",
+ " 7.096672561601736e-06,\n",
+ " -5.387410965340678e-06,\n",
+ " -2.6669129056244856e-06,\n",
+ " -7.514609478675993e-06,\n",
+ " -4.906923550151987e-06,\n",
+ " 8.834161235427018e-06,\n",
+ " 3.764742814382771e-06,\n",
+ " -2.0632476207538275e-06,\n",
+ " -9.851145478023682e-06,\n",
+ " -1.8097395013683126e-06,\n",
+ " -4.41548036178574e-06,\n",
+ " -8.050003089010715e-06,\n",
+ " 3.7295653783075977e-06,\n",
+ " 9.57884458330227e-06,\n",
+ " 2.167878301406745e-05,\n",
+ " 9.955059795174748e-06,\n",
+ " 1.0032590580522083e-05,\n",
+ " 2.2280208611391572e-07,\n",
+ " -1.5340559912147e-05,\n",
+ " 6.921275598870125e-06,\n",
+ " -7.953817657835316e-06,\n",
+ " -4.545486717688618e-06,\n",
+ " 5.223021616984624e-06,\n",
+ " -1.1777748113672715e-05,\n",
+ " 1.2032882068524486e-07,\n",
+ " 2.5436368105147267e-06,\n",
+ " -4.007128154626116e-06,\n",
+ " -4.625865130947204e-06,\n",
+ " 6.29075702818227e-06,\n",
+ " -4.9613495320954826e-06,\n",
+ " -8.442878424830269e-06,\n",
+ " 7.333171652135206e-06,\n",
+ " -1.4220910088624805e-05,\n",
+ " 7.928750989094624e-08,\n",
+ " -2.740032641668222e-06,\n",
+ " -2.5021523470059037e-05,\n",
+ " -7.61878573030117e-06,\n",
+ " -1.1419332622608636e-05,\n",
+ " 2.4474932160956087e-06,\n",
+ " 1.485894426878076e-05,\n",
+ " 1.5723710021120496e-05,\n",
+ " 1.260389035451226e-05,\n",
+ " -1.7962748870559153e-06,\n",
+ " 7.697349246882368e-06,\n",
+ " -4.7447772999476e-07,\n",
+ " -9.30458463699324e-06,\n",
+ " -7.958971764310263e-06,\n",
+ " 1.76919650130003e-06,\n",
+ " 1.009684638120234e-05,\n",
+ " -6.442683570639929e-06,\n",
+ " -4.0960849219118245e-06,\n",
+ " -1.1590017493290361e-05,\n",
+ " -1.1500655091367662e-05,\n",
+ " 2.217011115135392e-06,\n",
+ " -7.481859938707203e-06,\n",
+ " -5.08925222675316e-06,\n",
+ " -1.920307340697036e-06,\n",
+ " 6.130998372100294e-06,\n",
+ " 1.5725390767329372e-05,\n",
+ " 1.7182246665470302e-06,\n",
+ " -1.39063422466279e-05,\n",
+ " -4.5249123559187865e-07,\n",
+ " 3.9263750295504e-06,\n",
+ " -1.0580356502032373e-05,\n",
+ " 7.432037818944082e-06,\n",
+ " -7.070829724398209e-06,\n",
+ " -1.3689161278307438e-05,\n",
+ " 1.449103274353547e-05,\n",
+ " -1.0135342563444283e-05,\n",
+ " -1.5745061318739317e-05,\n",
+ " -7.4822410169872455e-06,\n",
+ " -1.1051809451601002e-05,\n",
+ " 4.1868775042530615e-06,\n",
+ " 9.884352948574815e-06,\n",
+ " 1.2161255654064007e-05,\n",
+ " 8.988836270873435e-06,\n",
+ " 1.5586136214551516e-05,\n",
+ " 1.3316592230694368e-05,\n",
+ " 1.9536939817044185e-06,\n",
+ " 1.48480894495151e-05,\n",
+ " 9.775418448043638e-07,\n",
+ " -1.01015457403264e-05,\n",
+ " 1.1648493455140851e-05,\n",
+ " 1.7001255400828086e-05,\n",
+ " 8.68959614308551e-06,\n",
+ " -4.733224614028586e-06,\n",
+ " -3.359599816121772e-07,\n",
+ " 7.296191142813768e-06,\n",
+ " -1.1999553862551693e-05,\n",
+ " -1.108655305870343e-05,\n",
+ " -1.0323303285986185e-05,\n",
+ " -1.2453906492737588e-05,\n",
+ " 2.3685979613219388e-06,\n",
+ " -1.6306898032780737e-05,\n",
+ " -1.947776945598889e-05,\n",
+ " -4.938618076266721e-06,\n",
+ " -1.0393100637884345e-05,\n",
+ " -3.8093040188869054e-07,\n",
+ " -6.0097859204688575e-06,\n",
+ " -1.8376644220552407e-05,\n",
+ " -1.202911062136991e-05,\n",
+ " -1.1844088476209436e-05,\n",
+ " -1.448881630494725e-05,\n",
+ " -4.916828402201645e-06,\n",
+ " 5.875308943359414e-06,\n",
+ " -3.0370817967195762e-06,\n",
+ " -1.955458856173209e-06,\n",
+ " 1.7943366401595995e-06,\n",
+ " -3.5859382023772923e-06,\n",
+ " 1.0365051821281668e-05,\n",
+ " 1.753205833665561e-05,\n",
+ " 6.2291169342643116e-06,\n",
+ " 5.707593118131626e-06,\n",
+ " 1.889043596747797e-05,\n",
+ " 9.10364087758353e-06,\n",
+ " -3.5157472666469403e-06,\n",
+ " 5.5630103190651425e-08,\n",
+ " -2.0768382455571555e-05,\n",
+ " -3.402119182283059e-05,\n",
+ " -2.3694810806773603e-05,\n",
+ " -1.2018410416203551e-05,\n",
+ " -1.0020842637459282e-05,\n",
+ " -7.86699092714116e-06,\n",
+ " 1.1633902431640308e-05,\n",
+ " 1.076963326340774e-05,\n",
+ " 8.003537914191838e-06,\n",
+ " 1.4259092495194636e-05,\n",
+ " 1.0898133041337132e-05,\n",
+ " 6.37884249954368e-06,\n",
+ " -7.718677807133645e-06,\n",
+ " -8.524904842488468e-06,\n",
+ " -7.6022884059057105e-06,\n",
+ " -1.0555138032941613e-05,\n",
+ " -3.5159812341589713e-06,\n",
+ " 7.530075436079642e-06,\n",
+ " 1.0387689144408796e-05,\n",
+ " -8.468977284792345e-06,\n",
+ " -7.88286797615001e-06,\n",
+ " 3.89456454286119e-06,\n",
+ " 8.938662176660728e-06,\n",
+ " 1.5746254575788043e-05,\n",
+ " 1.2848419828515034e-05,\n",
+ " -6.283018592512235e-06,\n",
+ " -4.589786476572044e-05,\n",
+ " -2.8716340239043348e-05,\n",
+ " -5.792558681605442e-07,\n",
+ " -2.4877401301637292e-05,\n",
+ " -6.73655040372978e-06,\n",
+ " 6.9134339355514385e-06,\n",
+ " -6.824921456427546e-06,\n",
+ " -1.2490161680034362e-05,\n",
+ " -2.233146551589016e-05,\n",
+ " 2.481402134435484e-06,\n",
+ " -4.658333523366309e-07,\n",
+ " -9.92243440123275e-06,\n",
+ " 2.0025043340865523e-05,\n",
+ " 2.194338321714895e-06,\n",
+ " -3.986852334492141e-06,\n",
+ " 4.220222763251513e-06,\n",
+ " -3.359585207363125e-06,\n",
+ " 1.6230842447839677e-05,\n",
+ " 1.2539951057988219e-05,\n",
+ " 1.1603340681176633e-05,\n",
+ " 5.009600499761291e-06,\n",
+ " -1.0409043170511723e-05,\n",
+ " 1.0141898201254662e-06,\n",
+ " 3.726794830072322e-06,\n",
+ " 1.5802459529368207e-05,\n",
+ " 7.333504186135542e-07,\n",
+ " -1.2009487363684457e-05,\n",
+ " 6.5643102971080225e-06,\n",
+ " 3.6906267268932424e-06,\n",
+ " 1.251379944733344e-05,\n",
+ " -5.205106845096452e-06,\n",
+ " -1.9450768377282657e-05,\n",
+ " 1.2190085726615507e-05,\n",
+ " -1.8742897736956365e-05,\n",
+ " -3.2488980650668964e-05,\n",
+ " 1.943043571372982e-05,\n",
+ " 1.3126547855790704e-05,\n",
+ " -3.9506840039393865e-06,\n",
+ " -1.137647450377699e-05,\n",
+ " -1.3769224096904509e-05,\n",
+ " -2.776794644887559e-05,\n",
+ " -2.1549516532104462e-05,\n",
+ " 1.0935843420156743e-05,\n",
+ " 9.687621059129015e-06,\n",
+ " 1.8455506506143138e-05,\n",
+ " 4.405374909310922e-08,\n",
+ " -1.1642589925031643e-05,\n",
+ " -7.992652172106318e-06,\n",
+ " -3.035109693882987e-05,\n",
+ " -1.3819481864629779e-05,\n",
+ " 4.22080083808396e-05,\n",
+ " 3.17500380333513e-05,\n",
+ " -2.1308244413376087e-06,\n",
+ " 2.537862201279495e-05,\n",
+ " 2.7118945581605658e-05,\n",
+ " -2.8643494260904845e-06,\n",
+ " 5.2919285735697486e-06,\n",
+ " 1.7594611563254148e-05,\n",
+ " -2.9288825317053124e-05,\n",
+ " -1.917968074849341e-05,\n",
+ " -1.3388311344897375e-05,\n",
+ " -1.6159528968273662e-05,\n",
+ " 1.7609983842703514e-05,\n",
+ " 1.9821449313894846e-05,\n",
+ " 7.935160101624206e-05,\n",
+ " 5.595259426627308e-05,\n",
+ " -1.1405691680010932e-07,\n",
+ " 2.347430563531816e-05,\n",
+ " 3.1654613849241287e-05,\n",
+ " -1.402771317771112e-06,\n",
+ " 1.2425136446836405e-05,\n",
+ " 9.050329026649706e-06,\n",
+ " -3.663960887934081e-05,\n",
+ " -1.0404580280010123e-05,\n",
+ " -1.3193103768571746e-05,\n",
+ " -4.851849007536657e-05,\n",
+ " -4.0840695874067023e-05,\n",
+ " -1.5041036931506824e-05,\n",
+ " -9.056125236384105e-06,\n",
+ " -2.1779609596705996e-05,\n",
+ " 3.7825402614544146e-06,\n",
+ " 9.481176675762981e-06,\n",
+ " -7.935016583360266e-06,\n",
+ " 2.1812393242726102e-05,\n",
+ " -4.389221066958271e-05,\n",
+ " -7.683394505875185e-05,\n",
+ " 3.3046930184355006e-05,\n",
+ " 4.2977382690878585e-05,\n",
+ " 3.317376467748545e-05,\n",
+ " 3.2026033295551315e-05,\n",
+ " -9.251935262000188e-05,\n",
+ " -9.222578955814242e-05,\n",
+ " -9.303420665673912e-05,\n",
+ " -4.8010770115070045e-05,\n",
+ " 3.156602133458364e-06,\n",
+ " -7.737685518804938e-05,\n",
+ " -1.5295167031581514e-05,\n",
+ " -5.255552605376579e-05,\n",
+ " -7.028886466287076e-05,\n",
+ " -1.0162171747651882e-05,\n",
+ " -4.2039981053676456e-05,\n",
+ " -5.52557066839654e-05,\n",
+ " -3.1521640266873874e-06,\n",
+ " 1.7847731214715168e-05,\n",
+ " 5.709413926524576e-06,\n",
+ " 3.611280408222228e-05,\n",
+ " 5.5505715863546357e-05,\n",
+ " 6.15481985732913e-05,\n",
+ " 1.4712682059325743e-05,\n",
+ " -4.145135244471021e-05,\n",
+ " -9.89453328656964e-05,\n",
+ " -7.014871516730636e-05,\n",
+ " -4.869193799095228e-05,\n",
+ " -8.726437226869166e-05,\n",
+ " -3.1136078177951276e-05,\n",
+ " 5.242591578280553e-05,\n",
+ " 9.224986570188776e-05,\n",
+ " 8.003971743164584e-05,\n",
+ " 1.1792234545282554e-05,\n",
+ " 5.2525610954035074e-05,\n",
+ " 0.00016469424008391798,\n",
+ " 0.00013440122711472213,\n",
+ " 7.873043068684638e-05,\n",
+ " -1.849793261499144e-05,\n",
+ " -6.660049984930083e-05,\n",
+ " -0.00011221249587833881,\n",
+ " -0.00020719075109809637,\n",
+ " -0.00012047128984704614,\n",
+ " -2.6872832677327096e-05,\n",
+ " 2.2667696612188593e-05,\n",
+ " -1.969856020878069e-05,\n",
+ " -0.00011491768236737698,\n",
+ " -4.643991633201949e-05,\n",
+ " 4.8707246605772525e-05,\n",
+ " 4.943184831063263e-05,\n",
+ " 7.596169598400593e-05,\n",
+ " 0.00013691159256268293,\n",
+ " 4.322527092881501e-05,\n",
+ " -1.6893087376956828e-05,\n",
+ " 5.0081736844731495e-05,\n",
+ " -2.3035656795400428e-06,\n",
+ " -9.36760552576743e-05,\n",
+ " -6.680106889689341e-05,\n",
+ " -8.163091115420684e-05,\n",
+ " -0.00013901303464081138,\n",
+ " -6.240574293769896e-05,\n",
+ " -6.23687737970613e-05,\n",
+ " -0.00012946980132255703,\n",
+ " -7.874608127167448e-05,\n",
+ " -5.311179847922176e-05,\n",
+ " 6.235996261239052e-05,\n",
+ " 3.246909955123556e-06,\n",
+ " -4.7826069931034e-06,\n",
+ " 8.433376933680847e-05,\n",
+ " 2.6779020117828622e-05,\n",
+ " 6.296257197391242e-05,\n",
+ " 6.666882836725563e-05,\n",
+ " 0.00014777980686631054,\n",
+ " 0.00012131642870372161,\n",
+ " 0.0001089814177248627,\n",
+ " 0.0001243192673427984,\n",
+ " 0.00015571714902762324,\n",
+ " 0.00013959765783511102,\n",
+ " 8.143330342136323e-05,\n",
+ " -2.919105281762313e-05,\n",
+ " 2.356824006710667e-05,\n",
+ " 0.0001330319937551394,\n",
+ " -0.00010654888319550082,\n",
+ " -0.00015104514022823423,\n",
+ " -1.7237294969163486e-06,\n",
+ " -8.616282684670296e-06,\n",
+ " -0.0001304057368542999,\n",
+ " -0.00014792165893595666,\n",
+ " -4.636901576304808e-05,\n",
+ " -5.0104139518225566e-05,\n",
+ " -0.0002990536158904433,\n",
+ " -0.0001611856569070369,\n",
+ " 3.1399344152305275e-05,\n",
+ " -0.000132469751406461,\n",
+ " -0.00018147747323382646,\n",
+ " -0.00010736700642155483,\n",
+ " -2.1295096303219907e-05,\n",
+ " 1.009459901979426e-05,\n",
+ " 1.2799602700397372e-05,\n",
+ " 1.151547985500656e-05,\n",
+ " 6.843547453172505e-05,\n",
+ " 9.606856474420056e-05,\n",
+ " 9.045445767696947e-05,\n",
+ " 6.120488251326606e-05,\n",
+ " 8.441465615760535e-05,\n",
+ " 0.0001641901908442378,\n",
+ " 5.01130307384301e-05,\n",
+ " 0.00015716641792096198,\n",
+ " 0.0002123442682204768,\n",
+ " 0.00014034795458428562,\n",
+ " 4.848799653700553e-05,\n",
+ " -2.2342319425661117e-05,\n",
+ " 0.00013348134234547615,\n",
+ " 3.1830692023504525e-05,\n",
+ " -5.147581032360904e-05,\n",
+ " -3.612533328123391e-05,\n",
+ " -7.694823580095544e-05,\n",
+ " -0.00016058790788520128,\n",
+ " -9.496195707470179e-05,\n",
+ " -0.0001101286688935943,\n",
+ " -0.00013909226981922984,\n",
+ " -1.1063350029871799e-05,\n",
+ " 0.00011010119487764314,\n",
+ " 0.00011600216384977102,\n",
+ " 0.00019023225468117744,\n",
+ " 0.0002426487480988726,\n",
+ " 0.00010992331226589158,\n",
+ " 2.5787114736885997e-06,\n",
+ " 0.00011936755618080497,\n",
+ " 0.00023873141617514193,\n",
+ " 0.00018217964679934084,\n",
+ " -2.7061116270488128e-05,\n",
+ " -0.00022428484226111323,\n",
+ " -0.00021801478578709066,\n",
+ " -0.0003192881995346397,\n",
+ " -0.0002740871859714389,\n",
+ " -0.00019311309733893722,\n",
+ " 2.7026420866604894e-05,\n",
+ " 0.00013078181655146182,\n",
+ " 4.5111806684872136e-05,\n",
+ " -2.0362822397146374e-05,\n",
+ " 9.087563375942409e-05,\n",
+ " 0.0002462242264300585,\n",
+ " 0.0002689131360966712,\n",
+ " 0.00010980955994455144,\n",
+ " 5.090952618047595e-05,\n",
+ " 5.192744356463663e-05,\n",
+ " -6.45309773972258e-05,\n",
+ " -7.519905193476006e-05,\n",
+ " -8.153734233928844e-05,\n",
+ " 7.444979019055609e-06,\n",
+ " 7.776454003760591e-05,\n",
+ " 0.0002075267257168889,\n",
+ " 0.00016918750770855695,\n",
+ " 0.00010674035729607567,\n",
+ " 0.0002108109329128638,\n",
+ " 0.00016350901569239795,\n",
+ " 1.669410448812414e-05,\n",
+ " 3.8646976463496685e-05,\n",
+ " 7.375796849373728e-05,\n",
+ " -2.4458886400680058e-05,\n",
+ " 8.693597010278609e-06,\n",
+ " 5.809446156490594e-05,\n",
+ " 1.191855858451163e-06,\n",
+ " 0.00010823398770298809,\n",
+ " 4.7792374971322715e-05,\n",
+ " -4.514107422437519e-05,\n",
+ " -0.00023841708025429398,\n",
+ " -0.00011803392408182845,\n",
+ " 2.7330122975399718e-05,\n",
+ " 1.1853323485411238e-05,\n",
+ " 0.00019604979024734348,\n",
+ " 0.00013344424951355904,\n",
+ " -5.1348648412385955e-05,\n",
+ " 1.0774405382107943e-05,\n",
+ " -2.9654083846253343e-06,\n",
+ " -8.748386608203873e-05,\n",
+ " 0.00010109435970662162,\n",
+ " 2.6487170543987304e-05,\n",
+ " 3.6564739275490865e-05,\n",
+ " 6.713915354339406e-05,\n",
+ " 4.5191140088718385e-05,\n",
+ " -2.1609097530017607e-05,\n",
+ " -7.378564532700693e-06,\n",
+ " -7.888385880505666e-05,\n",
+ " -0.0002154568792320788,\n",
+ " -0.000145167694427073,\n",
+ " 2.6567699023871683e-05,\n",
+ " 4.369384623714723e-05,\n",
+ " 0.00012208212865516543,\n",
+ " 0.0002858135267160833,\n",
+ " -0.00014620411093346775,\n",
+ " -0.0006079706945456564,\n",
+ " -0.00020936367218382657,\n",
+ " -0.00047369295498356223,\n",
+ " -0.0001054705135175027,\n",
+ " 0.0008836627821438015,\n",
+ " 0.0013496670871973038,\n",
+ " 0.0027453249786049128,\n",
+ " 0.0025710526388138533,\n",
+ " 0.0015551138203591108,\n",
+ " 0.001080634887330234,\n",
+ " 0.0008872239850461483,\n",
+ " 0.0009075886337086558,\n",
+ " 0.0006197893526405096,\n",
+ " 0.000416270864661783,\n",
+ " -0.00016791437519714236,\n",
+ " -0.0007641413831152022,\n",
+ " -0.0007789021474309266,\n",
+ " -0.001357047469355166,\n",
+ " -0.0012476093834266067,\n",
+ " 8.782377699390054e-05,\n",
+ " 0.0004825028299819678,\n",
+ " -0.0001709852513158694,\n",
+ " -0.0005816190387122333,\n",
+ " -0.00017099850811064243,\n",
+ " -0.00016036740271374583,\n",
+ " -0.00011844086839118972,\n",
+ " 0.0011871791211888194,\n",
+ " 0.0016316876281052828,\n",
+ " 0.0006828965269960463,\n",
+ " 0.0004519265203271061,\n",
+ " 0.001074681174941361,\n",
+ " 0.0010790082160383463,\n",
+ " 0.0009858141420409083,\n",
+ " 0.0010932921431958675,\n",
+ " 0.0005609282525256276,\n",
+ " -2.288190989929717e-05,\n",
+ " -0.00033438880927860737,\n",
+ " 0.000139948635478504,\n",
+ " -1.0142367500520777e-05,\n",
+ " -6.889018550282344e-05,\n",
+ " 0.00016957070329226553,\n",
+ " -0.0003424382593948394,\n",
+ " -0.0007459634216502309,\n",
+ " -0.0005430167657323182,\n",
+ " -0.00038140465039759874,\n",
+ " -0.00017398179625160992,\n",
+ " 7.747487984488544e-07,\n",
+ " -0.000396851624827832,\n",
+ " -0.00044070163858123124,\n",
+ " -0.000595868390519172,\n",
+ " -0.0005878267111256719,\n",
+ " -0.00023124573635868728,\n",
+ " -0.00020316074369475245,\n",
+ " -0.00024531196686439216,\n",
+ " 3.986380033893511e-05,\n",
+ " 0.00011146595352329314,\n",
+ " -2.4453678634017706e-05,\n",
+ " -0.0006906524649821222,\n",
+ " -0.0009093093685805798,\n",
+ " -0.00051727524260059,\n",
+ " -0.0006183372461237013,\n",
+ " -0.0006579476175829768,\n",
+ " -0.000635930395219475,\n",
+ " -0.0006922201719135046,\n",
+ " -0.0004303935857024044,\n",
+ " -0.0005302050849422812,\n",
+ " -0.00024216649762820452,\n",
+ " 0.00023431211593560874,\n",
+ " 0.00011247658403590322,\n",
+ " 0.00018101415480487049,\n",
+ " -0.00018178665777668357,\n",
+ " -0.00042956657125614583,\n",
+ " -0.00017226941417902708,\n",
+ " -0.0001543180551379919,\n",
+ " -7.395684951916337e-05,\n",
+ " 0.00019948300905525684,\n",
+ " 0.00046221629600040615,\n",
+ " 0.0005982925067655742,\n",
+ " 0.0004946643020957708,\n",
+ " 0.0006673666648566723,\n",
+ " 0.0005782609805464745,\n",
+ " 0.0009611182613298297,\n",
+ " 0.0011338695185258985,\n",
+ " 0.0007775807753205299,\n",
+ " 0.0008717699674889445,\n",
+ " 0.0006845758762210608,\n",
+ " 0.0004492047009989619,\n",
+ " 0.0008688060333952308,\n",
+ " 0.0008808042039163411,\n",
+ " 0.0006824168376624584,\n",
+ " 0.0008754846639931202,\n",
+ " 0.0009170355042442679,\n",
+ " 0.0008947315509431064,\n",
+ " 0.00037638196954503655,\n",
+ " 0.00012063443864462897,\n",
+ " 0.0001205943917739205,\n",
+ " -0.00027893096557818353,\n",
+ " -0.00034151668660342693,\n",
+ " 4.072048614034429e-05,\n",
+ " 0.00039558170828968287,\n",
+ " 0.00036184664350003004,\n",
+ " 0.0002830892044585198,\n",
+ " 0.00034134864108636975,\n",
+ " 0.00018620165064930916,\n",
+ " 0.00010010011465055868,\n",
+ " -0.0010110342409461737,\n",
+ " -0.0014716117875650525,\n",
+ " -0.00143453071359545,\n",
+ " -0.001432304852642119,\n",
+ " -0.0011346882674843073,\n",
+ " -0.001606724807061255,\n",
+ " -0.0016859000315889716,\n",
+ " -0.000970147259067744,\n",
+ " -0.0005429228767752647,\n",
+ " -0.00030031995265744627,\n",
+ " 1.155224526883103e-05,\n",
+ " 3.038569775526412e-05,\n",
+ " 0.00020400401263032109,\n",
+ " 0.0001430936681572348,\n",
+ " 0.00018651645223144442,\n",
+ " 0.00010877644672291353,\n",
+ " 0.00030995538691058755,\n",
+ " -8.552531653549522e-05,\n",
+ " -0.000462948257336393,\n",
+ " -0.00018602913769427687,\n",
+ " -0.0003838155244011432,\n",
+ " -0.0003198512422386557,\n",
+ " -0.00021176040172576904,\n",
+ " 9.72350753727369e-05,\n",
+ " 0.0004510935686994344,\n",
+ " 0.0004399212484713644,\n",
+ " 0.00031747695174999535,\n",
+ " 0.0003753192431759089,\n",
+ " 0.0006823971052654088,\n",
+ " 0.0006168982945382595,\n",
+ " 0.0007508978014811873,\n",
+ " 0.000813269754871726,\n",
+ " 0.0009154973668046296,\n",
+ " 0.0009459103457629681,\n",
+ " 0.0009559307363815606,\n",
+ " 0.0010801347671076655,\n",
+ " 0.0009640233474783599,\n",
+ " 0.0010575958294793963,\n",
+ " 0.0006060840096324682,\n",
+ " 0.00034192067687399685,\n",
+ " 0.0003646048135124147,\n",
+ " 0.0004367087676655501,\n",
+ " 1.916942528623622e-05,\n",
+ " 3.2880798244150355e-05,\n",
+ " 0.00038082696846686304,\n",
+ " 0.00012591760605573654,\n",
+ " -2.8013619157718495e-05,\n",
+ " 0.0001235983509104699,\n",
+ " 1.4137553080217913e-05,\n",
+ " -2.3595706807100214e-05,\n",
+ " 0.0001487635017838329,\n",
+ " -7.12920882506296e-05,\n",
+ " 0.00020064985437784344,\n",
+ " 0.00037825695471838117,\n",
+ " 0.00010225615551462397,\n",
+ " 0.00045870363828726113,\n",
+ " 0.0006968996021896601,\n",
+ " 0.00017369362467434257,\n",
+ " -4.9393267545383424e-05,\n",
+ " 1.6946180039667524e-05,\n",
+ " 4.866662493441254e-05,\n",
+ " -0.0002002955152420327,\n",
+ " -0.0003151880227960646,\n",
+ " -0.0002837583888322115,\n",
+ " 0.00024368561571463943,\n",
+ " 0.0004453646542970091,\n",
+ " 0.0005855893832631409,\n",
+ " 0.0011631479719653726,\n",
+ " 0.0013774990802630782,\n",
+ " 0.0010882096830755472,\n",
+ " 0.0007196713704615831,\n",
+ " 0.00037932785926386714,\n",
+ " 0.00010151328751817346,\n",
+ " -8.730047557037324e-05,\n",
+ " -0.00012939993757754564,\n",
+ " -2.2049964627512963e-06,\n",
+ " -0.00017646400374360383,\n",
+ " -3.2087438739836216e-05,\n",
+ " 0.0001759737788233906,\n",
+ " 0.0003559555334504694,\n",
+ " 0.0005503479042090476,\n",
+ " 0.0006103859050199389,\n",
+ " 0.0002528515178710222,\n",
+ " -0.00012169693945907056,\n",
+ " -0.0001489692076575011,\n",
+ " -0.00019180992967449129,\n",
+ " -0.00040130424895323813,\n",
+ " -0.00041239141137339175,\n",
+ " -0.00045946170575916767,\n",
+ " -0.0005519830738194287,\n",
+ " -0.0007840750622563064,\n",
+ " -0.0008003039401955903,\n",
+ " -0.0007100746151991189,\n",
+ " -0.0006130843539722264,\n",
+ " -0.0004945085966028273,\n",
+ " -0.0004913583979941905,\n",
+ " -0.0006115196738392115,\n",
+ " -0.0006688353605568409,\n",
+ " -0.0005382486269809306,\n",
+ " -0.0005340047646313906,\n",
+ " -0.00046743024722673,\n",
+ " -0.00044509628787636757,\n",
+ " -0.0005086653400212526,\n",
+ " -0.000500195543281734,\n",
+ " -0.00046659092186018825,\n",
+ " -0.0005133801023475826,\n",
+ " -0.00048017987865023315,\n",
+ " -0.0004395547730382532,\n",
+ " -0.0004203759890515357,\n",
+ " -0.00037723666173405945,\n",
+ " -0.0003822047438006848,\n",
+ " -0.00039110504440031946,\n",
+ " -0.0003417454136069864,\n",
+ " -0.0003398265107534826,\n",
+ " -0.0003353268839418888,\n",
+ " -0.0002542625297792256,\n",
+ " -0.00023124455765355378,\n",
+ " -0.00023777743626851588,\n",
+ " -0.00021212473802734166,\n",
+ " -0.00020452585886232555,\n",
+ " -0.000187596699106507,\n",
+ " -0.00019606408022809774,\n",
+ " -0.00020279947784729302,\n",
+ " -0.00017684613703750074,\n",
+ " -0.00017732563719619066,\n",
+ " -0.00014782397192902863,\n",
+ " -0.00011781602370319888,\n",
+ " -8.917415834730491e-05,\n",
+ " -4.9099089665105566e-05,\n",
+ " -8.457600779365748e-05,\n",
+ " -7.757839193800464e-05,\n",
+ " -7.52684791223146e-05,\n",
+ " -8.628296200186014e-05,\n",
+ " -7.74143700255081e-05,\n",
+ " -6.788170867366716e-05,\n",
+ " -3.8799822505097836e-05,\n",
+ " -7.655523950234056e-05,\n",
+ " -8.956620877142996e-05,\n",
+ " -4.282548979972489e-05,\n",
+ " -2.8062066121492535e-05,\n",
+ " -4.497209738474339e-05,\n",
+ " -5.783312735729851e-05,\n",
+ " -5.520653212442994e-05,\n",
+ " -4.530717706074938e-05,\n",
+ " -2.6642175726010464e-05,\n",
+ " -4.3849497160408646e-05,\n",
+ " -5.280814366415143e-05,\n",
+ " -5.956970198894851e-05,\n",
+ " -5.251190668786876e-05,\n",
+ " -3.9139518776210025e-05,\n",
+ " -5.8879733842331916e-05,\n",
+ " -4.6917521103750914e-05,\n",
+ " 6.272055998124415e-06,\n",
+ " -1.0601198482618202e-05,\n",
+ " -9.605543709767517e-06,\n",
+ " -2.3336688173003495e-06,\n",
+ " -2.6358267859905027e-05,\n",
+ " -5.3046933317091316e-05,\n",
+ " -3.4945496736327186e-05,\n",
+ " -2.7895950552192517e-05,\n",
+ " -5.421862078947015e-05,\n",
+ " -3.388076584087685e-05,\n",
+ " -1.8789574824040756e-05,\n",
+ " 1.5857211792535963e-06,\n",
+ " 4.288214768166654e-06,\n",
+ " 2.426012997602811e-06,\n",
+ " 1.3274242519401014e-05,\n",
+ " -2.5067993192351423e-05,\n",
+ " -1.6368256183341146e-05,\n",
+ " -8.23355367174372e-06,\n",
+ " -1.3521567780117039e-05,\n",
+ " -1.4371404176927172e-05,\n",
+ " -1.5501434972975403e-05,\n",
+ " -1.3272861906443723e-05,\n",
+ " -6.009713160892716e-06,\n",
+ " -2.9685018034797395e-06,\n",
+ " -2.059615326288622e-06,\n",
+ " -2.824942555434973e-07,\n",
+ " -4.82729365103296e-06,\n",
+ " 1.7205953554366715e-05,\n",
+ " 1.1110057130281348e-05,\n",
+ " -9.169927579932846e-06,\n",
+ " -5.118149147165241e-06,\n",
+ " -1.637286550248973e-05,\n",
+ " -1.59986229846254e-05,\n",
+ " -2.2341155272442847e-05,\n",
+ " 3.7162412809266243e-06,\n",
+ " 4.918289960187394e-06,\n",
+ " -7.65648564993171e-06,\n",
+ " 1.4572195141226985e-05,\n",
+ " 2.66189563262742e-05,\n",
+ " 1.2821760719816666e-05,\n",
+ " 1.2756045180140063e-06,\n",
+ " 1.3107963241054676e-05,\n",
+ " -5.076688466942869e-06,\n",
+ " -1.2246602636878379e-05,\n",
+ " 5.074427008366911e-06,\n",
+ " 2.2858403099235147e-06,\n",
+ " -1.036216758620867e-06,\n",
+ " -1.4945949260436464e-06,\n",
+ " 5.163407877262216e-06,\n",
+ " 9.527766451356001e-06,\n",
+ " 6.767696959286695e-06,\n",
+ " -3.5286172987980535e-06,\n",
+ " 1.740137236083683e-06,\n",
+ " 3.816123808064731e-06,\n",
+ " 8.83773736859439e-06,\n",
+ " 7.527243269578321e-06,\n",
+ " -3.4768145269481465e-06,\n",
+ " -2.4399348603765247e-06,\n",
+ " 8.783008524915203e-06,\n",
+ " 5.252586106507806e-06,\n",
+ " 5.925839559495216e-06,\n",
+ " 2.6780130610859487e-06,\n",
+ " 1.2405352833866345e-07,\n",
+ " 6.176609076646855e-06,\n",
+ " 2.571237928350456e-06,\n",
+ " 5.796632081001007e-07,\n",
+ " 7.983027899172157e-06,\n",
+ " 1.1482878790047835e-06,\n",
+ " -8.004098503988644e-07,\n",
+ " 8.178865755326115e-06,\n",
+ " 9.541146027913783e-06,\n",
+ " 1.0843723430298269e-05,\n",
+ " 1.7192995073855855e-05,\n",
+ " 1.5891959264990874e-05,\n",
+ " 1.2850301573053002e-05,\n",
+ " 5.590013643086422e-06,\n",
+ " 2.682550530153094e-06,\n",
+ " -1.3775533034277032e-06,\n",
+ " 8.953415090218186e-06,\n",
+ " -1.0984241271216888e-05,\n",
+ " -1.9155572772433516e-06,\n",
+ " -4.706013442046242e-06,\n",
+ " -9.88646388577763e-06,\n",
+ " -1.1609959983616136e-05,\n",
+ " -6.284804840106517e-06,\n",
+ " ...],\n",
+ " 'path': '/workspace/xlsr_fi/common_voice_fi/clips/common_voice_fi_25838955.mp3',\n",
+ " 'sampling_rate': 16000},\n",
+ " 'dataset_name': 'common_voice_fi',\n",
+ " 'filename': 'common_voice_fi_25838955.mp3',\n",
+ " '__index_level_0__': 0.0,\n",
+ " 'input_values': [0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985727136954665,\n",
+ " 0.0004985716659575701,\n",
+ " 0.0004985818522982299,\n",
+ " 0.000498543435242027,\n",
+ " 0.0004986471030861139,\n",
+ " 0.0004984030383639038,\n",
+ " 0.000499133428093046,\n",
+ " 0.0004990276065655053,\n",
+ " 0.0004996009520255029,\n",
+ " 0.0005006061401218176,\n",
+ " 0.0004996101488359272,\n",
+ " 0.0004998384392820299,\n",
+ " 0.0005000458331778646,\n",
+ " 0.000498243432957679,\n",
+ " 0.0004991834284737706,\n",
+ " 0.0004998980439268053,\n",
+ " 0.0004984443658031523,\n",
+ " 0.0004994579940102994,\n",
+ " 0.0004985707346349955,\n",
+ " 0.000498549488838762,\n",
+ " 0.0004986330750398338,\n",
+ " 0.000498262990731746,\n",
+ " 0.0004954858450219035,\n",
+ " 0.0004954264732077718,\n",
+ " 0.0004993979237042367,\n",
+ " 0.0005007250001654029,\n",
+ " 0.0004981090314686298,\n",
+ " 0.0004948575515300035,\n",
+ " 0.0004946288536302745,\n",
+ " 0.0004957191995345056,\n",
+ " 0.000497197441291064,\n",
+ " 0.0005009074229747057,\n",
+ " 0.000498106935992837,\n",
+ " 0.000499738147482276,\n",
+ " 0.0005030575557611883,\n",
+ " 0.0005019637756049633,\n",
+ " 0.0005003929836675525,\n",
+ " 0.000498562993016094,\n",
+ " 0.000506003329064697,\n",
+ " 0.0005075667868368328,\n",
+ " 0.0005049830069765449,\n",
+ " 0.000514828716404736,\n",
+ " 0.0005095926462672651,\n",
+ " 0.0005042182165198028,\n",
+ " 0.0005077330861240625,\n",
+ " 0.0004996360512450337,\n",
+ " 0.0005016742506995797,\n",
+ " 0.000502155686262995,\n",
+ " 0.0004966180422343314,\n",
+ " 0.0005022199475206435,\n",
+ " 0.0004972119932062924,\n",
+ " 0.0004947402630932629,\n",
+ " 0.0005062011769041419,\n",
+ " 0.0005051119951531291,\n",
+ " 0.00048497685929760337,\n",
+ " 0.0004797449801117182,\n",
+ " 0.0005028821178711951,\n",
+ " 0.0005152482190169394,\n",
+ " 0.0005011905450373888,\n",
+ " 0.0004764741752296686,\n",
+ " 0.0004750069056171924,\n",
+ " 0.0004775508714374155,\n",
+ " 0.0004903867375105619,\n",
+ " 0.0005057034431956708,\n",
+ " 0.0004956696066074073,\n",
+ " 0.0005041636759415269,\n",
+ " 0.0005136580439284444,\n",
+ " 0.0005193015676923096,\n",
+ " 0.0005064313299953938,\n",
+ " 0.0005023378180339932,\n",
+ " 0.0005469516618177295,\n",
+ " 0.0005337225738912821,\n",
+ " 0.0005604383768513799,\n",
+ " 0.000605842680670321,\n",
+ " 0.0005463884444907308,\n",
+ " 0.0005674587446264923,\n",
+ " 0.0005609603831544518,\n",
+ " 0.000503954419400543,\n",
+ " 0.0005047211307100952,\n",
+ " 0.0005233189440332353,\n",
+ " 0.0005825993721373379,\n",
+ " 0.0005054721841588616,\n",
+ " 0.0005047476151958108,\n",
+ " 0.0006024710601195693,\n",
+ " 0.00043696537613868713,\n",
+ " 0.00035526114515960217,\n",
+ " 0.0004111550224479288,\n",
+ " 0.0004583991249091923,\n",
+ " 0.0005376826738938689,\n",
+ " 0.0005643131444230676,\n",
+ " 0.0005524925654754043,\n",
+ " 0.0004524159012362361,\n",
+ " 0.0004421717603690922,\n",
+ " 0.0005117302644066513,\n",
+ " 0.0005356257897801697,\n",
+ " 0.0005481801345013082,\n",
+ " 0.0005010631866753101,\n",
+ " 0.0004802536277566105,\n",
+ " 0.0004282956651877612,\n",
+ " 0.0003891698725055903,\n",
+ " 0.0004212077474221587,\n",
+ " 0.0005079199909232557,\n",
+ " 0.0005822557723149657,\n",
+ " 0.0005734841106459498,\n",
+ " 0.0006809241604059935,\n",
+ " 0.0007217021193355322,\n",
+ " 0.0006451821536757052,\n",
+ " 0.0006312783225439489,\n",
+ " 0.0006197924958541989,\n",
+ " 0.0004947521374560893,\n",
+ " 0.00029181112768128514,\n",
+ " 0.00033848610473796725,\n",
+ " 0.0003607911348808557,\n",
+ " 0.00031011507962830365,\n",
+ " 0.0004731146909762174,\n",
+ " 0.0005441787070594728,\n",
+ " 0.00048628958757035434,\n",
+ " 0.0005517824902199209,\n",
+ " 0.0007084615062922239,\n",
+ " 0.0006418685079552233,\n",
+ " 0.0005941910785622895,\n",
+ " 0.0006552153499796987,\n",
+ " 0.0005579656572081149,\n",
+ " 0.0006288908189162612,\n",
+ " 0.0007109865546226501,\n",
+ " 0.0006119011668488383,\n",
+ " 0.0005423963302746415,\n",
+ " 0.0005765173700638115,\n",
+ " 0.0004988817381672561,\n",
+ " 0.0003766389563679695,\n",
+ " 0.000534658320248127,\n",
+ " 0.0004967806744389236,\n",
+ " 0.0005034546484239399,\n",
+ " 0.0005808835267089307,\n",
+ " 0.00030858273385092616,\n",
+ " 0.00043945154175162315,\n",
+ " 0.0005484760040417314,\n",
+ " 0.0003931951359845698,\n",
+ " 0.0004389093373902142,\n",
+ " 0.00023617780243512243,\n",
+ " 0.0002693788555916399,\n",
+ " 0.0004700662975665182,\n",
+ " 0.0002893243217840791,\n",
+ " 0.0002552067453507334,\n",
+ " 0.00037929447717033327,\n",
+ " 0.0006357808597385883,\n",
+ " 0.000560831162147224,\n",
+ " 0.00022839559824205935,\n",
+ " 0.0004956956836394966,\n",
+ " 0.0005199732258915901,\n",
+ " 0.0004201463016215712,\n",
+ " 0.0006358952959999442,\n",
+ " 0.0005972553044557571,\n",
+ " 0.0006467084749601781,\n",
+ " 0.0007265140302479267,\n",
+ " 0.0008593810489401221,\n",
+ " 0.0007691770442761481,\n",
+ " 0.0006282987887971103,\n",
+ " 0.0006475530681200325,\n",
+ " 0.0002009285381063819,\n",
+ " 0.0005282476195134223,\n",
+ " 0.0007525502587668598,\n",
+ " 0.00023249122023116797,\n",
+ " 0.0005652037798427045,\n",
+ " 0.0005246721557341516,\n",
+ " 0.00037097380845807493,\n",
+ " 0.0006903671310283244,\n",
+ " 0.0004467305261641741,\n",
+ " 0.00021664139057975262,\n",
+ " 0.000464801472844556,\n",
+ " 0.0007234676158986986,\n",
+ " 0.0006693180184811354,\n",
+ " 0.0006552464328706264,\n",
+ " 0.00050248863408342,\n",
+ " 0.0005758391926065087,\n",
+ " 0.0006988045643083751,\n",
+ " 0.00034656748175621033,\n",
+ " 0.0004233260406181216,\n",
+ " 0.0002865488058887422,\n",
+ " 0.0003601243661250919,\n",
+ " 0.0007478276384063065,\n",
+ " 0.0006047945353202522,\n",
+ " 0.000440358417108655,\n",
+ " 0.00022062368225306273,\n",
+ " 0.0004475110908970237,\n",
+ " 0.0003739903913810849,\n",
+ " 0.0002714427246246487,\n",
+ " 0.0006038019782863557,\n",
+ " 0.0007688387995585799,\n",
+ " 0.0011102372081950307,\n",
+ " 0.0007794536650180817,\n",
+ " 0.0007816411671228707,\n",
+ " 0.0005048590828664601,\n",
+ " 6.574044527951628e-05,\n",
+ " 0.000693855807185173,\n",
+ " 0.0002741565986070782,\n",
+ " 0.00037032226100564003,\n",
+ " 0.0006459396681748331,\n",
+ " 0.00016626479919068515,\n",
+ " 0.0005019677337259054,\n",
+ " 0.0005703411297872663,\n",
+ " 0.00038551201578229666,\n",
+ " 0.0003680544323287904,\n",
+ " 0.0006760657415725291,\n",
+ " 0.00035858876071870327,\n",
+ " 0.00026035780319944024,\n",
+ " 0.0007054773741401732,\n",
+ " 9.733124170452356e-05,\n",
+ " 0.0005008098087273538,\n",
+ " 0.0004212629864923656,\n",
+ " -0.00020740691979881376,\n",
+ " 0.0002836094645317644,\n",
+ " 0.0001763774489518255,\n",
+ " 0.0005676284781657159,\n",
+ " 0.0009178163018077612,\n",
+ " 0.0009422154980711639,\n",
+ " 0.00085419014794752,\n",
+ " 0.0004478909831959754,\n",
+ " 0.0007157525978982449,\n",
+ " 0.0004851853591389954,\n",
+ " 0.00023604484158568084,\n",
+ " 0.0002740111667662859,\n",
+ " 0.000548490381333977,\n",
+ " 0.0007834541611373425,\n",
+ " 0.000316793069941923,\n",
+ " 0.00038300210144370794,\n",
+ " 0.0001715615944704041,\n",
+ " 0.0001740829466143623,\n",
+ " 0.0005611254600808024,\n",
+ " 0.00028747282340191305,\n",
+ " 0.0003549800021573901,\n",
+ " 0.0004443914513103664,\n",
+ " 0.0006715581985190511,\n",
+ " 0.0009422628791071475,\n",
+ " 0.0005470522446557879,\n",
+ " 0.00010620674584060907,\n",
+ " 0.0004858057072851807,\n",
+ " 0.0006093549891375005,\n",
+ " 0.00020004907855764031,\n",
+ " 0.0007082668598741293,\n",
+ " 0.00029907000134699047,\n",
+ " 0.0001123344773077406,\n",
+ " 0.0009074356639757752,\n",
+ " 0.00021260509674903005,\n",
+ " 5.4327480029314756e-05,\n",
+ " 0.0002874620840884745,\n",
+ " 0.0001867470855358988,\n",
+ " 0.0006167049868963659,\n",
+ " 0.0007774586556479335,\n",
+ " 0.0008417012286372483,\n",
+ " 0.0007521917577832937,\n",
+ " 0.0009383338619954884,\n",
+ " 0.0008742989739403129,\n",
+ " 0.0005536960088647902,\n",
+ " 0.0009175100130960345,\n",
+ " 0.0005261539481580257,\n",
+ " 0.0002135586692020297,\n",
+ " 0.000827233714517206,\n",
+ " 0.0009782613487914205,\n",
+ " 0.0007437487365677953,\n",
+ " 0.0003650252765510231,\n",
+ " 0.0004890936543233693,\n",
+ " 0.0007044340018182993,\n",
+ " 0.00016000657342374325,\n",
+ " 0.00018576679576653987,\n",
+ " 0.00020730181131511927,\n",
+ " 0.00014718706370331347,\n",
+ " 0.0005654024425894022,\n",
+ " 3.8475314795505255e-05,\n",
+ " -5.099048576084897e-05,\n",
+ " 0.0003592301218304783,\n",
+ " 0.00020533248607534915,\n",
+ " 0.0004878247855231166,\n",
+ " 0.00032900721998885274,\n",
+ " -1.992235229408834e-05,\n",
+ " 0.000159172632265836,\n",
+ " 0.00016439301543869078,\n",
+ " 8.97723002708517e-05,\n",
+ " 0.00035984491114504635,\n",
+ " 0.0006643439410254359,\n",
+ " 0.0004128817527089268,\n",
+ " 0.0004433996509760618,\n",
+ " 0.0005491997580975294,\n",
+ " 0.00039739583735354245,\n",
+ " 0.0007910215645097196,\n",
+ " 0.000993237947113812,\n",
+ " 0.0006743265548720956,\n",
+ " 0.0006596118328161538,\n",
+ " 0.001031564432196319,\n",
+ " 0.0007554310141131282,\n",
+ " 0.0003993762657046318,\n",
+ " 0.0005001422832719982,\n",
+ " -8.740499470150098e-05,\n",
+ " -0.00046133159776218235,\n",
+ " -0.00016997386410366744,\n",
+ " 0.00015947454085107893,\n",
+ " 0.00021583569468930364,\n",
+ " 0.00027660641353577375,\n",
+ " 0.0008268220699392259,\n",
+ " 0.0008024367270991206,\n",
+ " 0.0007243917207233608,\n",
+ " 0.0009008915512822568,\n",
+ " 0.0008060623658820987,\n",
+ " 0.0006785510922782123,\n",
+ " 0.0002807910495903343,\n",
+ " 0.0002580434374976903,\n",
+ " 0.0002840749511960894,\n",
+ " 0.00020076060900464654,\n",
+ " 0.0003993696882389486,\n",
+ " 0.0007110330043360591,\n",
+ " 0.0007916602189652622,\n",
+ " 0.00025962141808122396,\n",
+ " 0.00027615841827355325,\n",
+ " 0.0006084574852138758,\n",
+ " 0.0007507761474698782,\n",
+ " 0.0009428516495972872,\n",
+ " 0.0008610895602032542,\n",
+ " 0.0003212980227544904,\n",
+ " -0.0007964306860230863,\n",
+ " -0.0003116557782050222,\n",
+ " 0.00048222907935269177,\n",
+ " -0.0002033405180554837,\n",
+ " 0.0003085016505792737,\n",
+ " 0.00069363450165838,\n",
+ " 0.00030600829632021487,\n",
+ " 0.0001461641222704202,\n",
+ " -0.00013150721497368068,\n",
+ " 0.0005685851792804897,\n",
+ " 0.00048542924923822284,\n",
+ " 0.00021861227287445217,\n",
+ " 0.0010635771322995424,\n",
+ " 0.0005604856996797025,\n",
+ " 0.00038608410977758467,\n",
+ " 0.0006176458555273712,\n",
+ " 0.0004037823819089681,\n",
+ " 0.0009565242216922343,\n",
+ " 0.0008523861179128289,\n",
+ " 0.0008259597234427929,\n",
+ " 0.0006399180856533349,\n",
+ " 0.0002048826718237251,\n",
+ " 0.0005271880072541535,\n",
+ " 0.000603723805397749,\n",
+ " 0.0009444374591112137,\n",
+ " 0.0005192641401663423,\n",
+ " 0.0001597263035364449,\n",
+ " 0.0006837840192019939,\n",
+ " 0.000602703366894275,\n",
+ " 0.0008516482193954289,\n",
+ " 0.0003517111763358116,\n",
+ " -5.0228652980877087e-05,\n",
+ " 0.000842514680698514,\n",
+ " -3.0256156605901197e-05,\n",
+ " -0.00041810041875578463,\n",
+ " 0.001046800403855741,\n",
+ " 0.0008689368842169642,\n",
+ " 0.0003871045773848891,\n",
+ " 0.00017758669855538756,\n",
+ " 0.00011007551802322268,\n",
+ " -0.0002848969597835094,\n",
+ " -0.00010944460518658161,\n",
+ " 0.0008071264019235969,\n",
+ " 0.0007719079148955643,\n",
+ " 0.0010192928602918983,\n",
+ " 0.0004998156800866127,\n",
+ " 0.00017007827409543097,\n",
+ " 0.00027306086849421263,\n",
+ " -0.0003577802563086152,\n",
+ " 0.00010865749936783686,\n",
+ " 0.0016894672298803926,\n",
+ " 0.001394396647810936,\n",
+ " 0.000438451737863943,\n",
+ " 0.0012146277585998178,\n",
+ " 0.001263730926439166,\n",
+ " 0.00041775539284572005,\n",
+ " 0.0006478838622570038,\n",
+ " 0.0009950028033927083,\n",
+ " -0.00032780837500467896,\n",
+ " -4.257994442014024e-05,\n",
+ " 0.00012082292960258201,\n",
+ " 4.263331720721908e-05,\n",
+ " 0.0009954365668818355,\n",
+ " 0.0010578327346593142,\n",
+ " 0.0027374697383493185,\n",
+ " 0.002077269135043025,\n",
+ " 0.0004953546449542046,\n",
+ " 0.0011608977802097797,\n",
+ " 0.0013917043106630445,\n",
+ " 0.0004589936579577625,\n",
+ " 0.0008491466287523508,\n",
+ " 0.0007539268117398024,\n",
+ " -0.0005352099542506039,\n",
+ " 0.00020500858954619616,\n",
+ " 0.0001263306912733242,\n",
+ " -0.0008703713538125157,\n",
+ " -0.0006537431618198752,\n",
+ " 7.41914554964751e-05,\n",
+ " 0.00024305509577970952,\n",
+ " -0.00011593665840337053,\n",
+ " 0.0006052966928109527,\n",
+ " 0.0007660831324756145,\n",
+ " 0.0002746870741248131,\n",
+ " 0.0011140070855617523,\n",
+ " -0.000739841372705996,\n",
+ " -0.0016692888457328081,\n",
+ " 0.0014309883117675781,\n",
+ " 0.0017111749621108174,\n",
+ " 0.001434566918760538,\n",
+ " 0.0014021837851032615,\n",
+ " -0.002111851004883647,\n",
+ " -0.0021035680547356606,\n",
+ " -0.0021263775415718555,\n",
+ " -0.000856046041008085,\n",
+ " 0.0005876359064131975,\n",
+ " -0.0016846070066094398,\n",
+ " 6.702119571855292e-05,\n",
+ " -0.0009842758299782872,\n",
+ " -0.001484620152041316,\n",
+ " 0.00021184812067076564,\n",
+ " -0.0006875809049233794,\n",
+ " -0.0010604611597955227,\n",
+ " 0.0004096347256563604,\n",
+ " 0.0010021445341408253,\n",
+ " 0.0006596632301807404,\n",
+ " 0.0015174916479736567,\n",
+ " 0.002064660657197237,\n",
+ " 0.0022351485677063465,\n",
+ " 0.0009136894368566573,\n",
+ " -0.0006709728040732443,\n",
+ " -0.0022931592538952827,\n",
+ " -0.0014806658728048205,\n",
+ " -0.0008752651629038155,\n",
+ " -0.00196358235552907,\n",
+ " -0.00037992841680534184,\n",
+ " 0.0019777643028646708,\n",
+ " 0.0031013928819447756,\n",
+ " 0.0027568847872316837,\n",
+ " 0.0008312893914990127,\n",
+ " 0.001980577362701297,\n",
+ " 0.00514540309086442,\n",
+ " 0.0042906892485916615,\n",
+ " 0.0027199434116482735,\n",
+ " -2.3344491637544706e-05,\n",
+ " -0.0013805533526465297,\n",
+ " -0.0026674908585846424,\n",
+ " -0.0053472924046218395,\n",
+ " -0.002900511957705021,\n",
+ " -0.00025964141241274774,\n",
+ " 0.0011381393996998668,\n",
+ " -5.722007335862145e-05,\n",
+ " -0.002743817400187254,\n",
+ " -0.0008117245743051171,\n",
+ " 0.0018728425493463874,\n",
+ " 0.00189328717533499,\n",
+ " 0.0026418238412588835,\n",
+ " 0.004361518658697605,\n",
+ " 0.0017181691946461797,\n",
+ " 2.1936046323389746e-05,\n",
+ " 0.0019116237526759505,\n",
+ " 0.0004335778357926756,\n",
+ " -0.002144487341865897,\n",
+ " -0.001386212301440537,\n",
+ " -0.0018046348122879863,\n",
+ " -0.0034236654173582792,\n",
+ " -0.00126219866797328,\n",
+ " -0.0012611555866897106,\n",
+ " -0.0031544039957225323,\n",
+ " -0.0017232396639883518,\n",
+ " -0.0009999710600823164,\n",
+ " 0.0022580523509532213,\n",
+ " 0.0005901839467696846,\n",
+ " 0.00036363195977173746,\n",
+ " 0.0028780410066246986,\n",
+ " 0.0012541399337351322,\n",
+ " 0.002275055041536689,\n",
+ " 0.0023796267341822386,\n",
+ " 0.004668164066970348,\n",
+ " 0.003921502735465765,\n",
+ " 0.00357347191311419,\n",
+ " 0.004006227478384972,\n",
+ " 0.004892115481197834,\n",
+ " 0.004437305964529514,\n",
+ " 0.002796204760670662,\n",
+ " -0.000325049739331007,\n",
+ " 0.0011635480914264917,\n",
+ " 0.004252056125551462,\n",
+ " -0.0025076926685869694,\n",
+ " -0.003763149958103895,\n",
+ " 0.00044993788469582796,\n",
+ " 0.00025546521646901965,\n",
+ " -0.0031808114144951105,\n",
+ " -0.003675021231174469,\n",
+ " -0.000809724151622504,\n",
+ " -0.000915110285859555,\n",
+ " -0.007939192466437817,\n",
+ " -0.004049263428896666,\n",
+ " 0.0013845019275322556,\n",
+ " -0.00323904724791646,\n",
+ " -0.004621794912964106,\n",
+ " -0.0025307759642601013,\n",
+ " -0.00010226616723230109,\n",
+ " 0.0007833907147869468,\n",
+ " 0.0008597121341153979,\n",
+ " 0.0008234807755798101,\n",
+ " 0.0024294722825288773,\n",
+ " 0.003209137124940753,\n",
+ " 0.0030507356859743595,\n",
+ " 0.002225461881607771,\n",
+ " 0.002880323212593794,\n",
+ " 0.005131181329488754,\n",
+ " 0.0019125064136460423,\n",
+ " 0.0049330065958201885,\n",
+ " 0.006489843595772982,\n",
+ " 0.0044584753923118114,\n",
+ " 0.0018666564719751477,\n",
+ " -0.00013181346002966166,\n",
+ " 0.00426473468542099,\n",
+ " 0.001396672334522009,\n",
+ " -0.0009538118029013276,\n",
+ " -0.0005206997157074511,\n",
+ " -0.0016725135501474142,\n",
+ " -0.004032398108392954,\n",
+ " -0.0021807688754051924,\n",
+ " -0.00260869599878788,\n",
+ " -0.003425900824368,\n",
+ " 0.00018642147188074887,\n",
+ " 0.0036050663329660892,\n",
+ " 0.0037715614307671785,\n",
+ " 0.005865955725312233,\n",
+ " 0.007344881538301706,\n",
+ " 0.0036000474356114864,\n",
+ " 0.000571330776438117,\n",
+ " 0.003866515588015318,\n",
+ " 0.0072343540377914906,\n",
+ " 0.00563875213265419,\n",
+ " -0.0002649538218975067,\n",
+ " -0.005829600151628256,\n",
+ " -0.00565269123762846,\n",
+ " -0.008510109968483448,\n",
+ " -0.00723476754501462,\n",
+ " -0.004950092639774084,\n",
+ " 0.001261120312847197,\n",
+ " 0.004188567865639925,\n",
+ " 0.0017713976558297873,\n",
+ " -7.596216164529324e-05,\n",
+ " 0.0030626191291958094,\n",
+ " 0.0074457633309066296,\n",
+ " 0.008085927926003933,\n",
+ " 0.003596837632358074,\n",
+ " 0.0019349795766174793,\n",
+ " 0.0019637001678347588,\n",
+ " -0.0013221619883552194,\n",
+ " -0.0016231605550274253,\n",
+ " -0.001801994745619595,\n",
+ " 0.0007086319965310395,\n",
+ " 0.0026926910504698753,\n",
+ " 0.0063539170660078526,\n",
+ " 0.0052721803076565266,\n",
+ " 0.003510240465402603,\n",
+ " 0.006446580868214369,\n",
+ " 0.005111962091177702,\n",
+ " 0.000969595042988658,\n",
+ " 0.0015889930073171854,\n",
+ " 0.0025796459522098303,\n",
+ " -0.00019153217726852745,\n",
+ " 0.0007438616594299674,\n",
+ " 0.002137701725587249,\n",
+ " 0.0005322007928043604,\n",
+ " 0.003552383277565241,\n",
+ " 0.0018470295472070575,\n",
+ " -0.0007750779041089118,\n",
+ " -0.006228339858353138,\n",
+ " -0.0028317419346421957,\n",
+ " 0.0012696891790255904,\n",
+ " 0.0008330129785463214,\n",
+ " 0.006030096672475338,\n",
+ " 0.004263687878847122,\n",
+ " -0.0009502239408902824,\n",
+ " 0.0008025714196264744,\n",
+ " 0.00041490403236821294,\n",
+ " -0.0019697751849889755,\n",
+ " 0.003350939368829131,\n",
+ " 0.0012459054123610258,\n",
+ " 0.0015302429674193263,\n",
+ " 0.002392896916717291,\n",
+ " 0.0017736359732225537,\n",
+ " -0.00011112567881355062,\n",
+ " 0.00029038728098385036,\n",
+ " -0.0017271270044147968,\n",
+ " -0.005580520257353783,\n",
+ " -0.0035973184276372194,\n",
+ " 0.001248177606612444,\n",
+ " 0.0017313899006694555,\n",
+ " 0.0039431070908904076,\n",
+ " 0.00856277160346508,\n",
+ " -0.003626560792326927,\n",
+ " -0.01665525510907173,\n",
+ " -0.005408600904047489,\n",
+ " -0.01286662369966507,\n",
+ " -0.0024772665929049253,\n",
+ " 0.02543102391064167,\n",
+ " 0.03857928514480591,\n",
+ " 0.0779576227068901,\n",
+ " 0.07304054498672485,\n",
+ " 0.0443759448826313,\n",
+ " 0.030988572165369987,\n",
+ " 0.025531504303216934,\n",
+ " 0.0261060893535614,\n",
+ " 0.017985863611102104,\n",
+ " 0.012243611738085747,\n",
+ " -0.004239113535732031,\n",
+ " -0.021061595529317856,\n",
+ " -0.021478068083524704,\n",
+ " -0.03779037669301033,\n",
+ " -0.034702591598033905,\n",
+ " 0.0029765113722532988,\n",
+ " 0.014112338423728943,\n",
+ " -0.004325758200138807,\n",
+ " -0.01591174677014351,\n",
+ " -0.004326132126152515,\n",
+ " -0.004026176407933235,\n",
+ " -0.0028432237450033426,\n",
+ " 0.033994704484939575,\n",
+ " 0.04653646796941757,\n",
+ " 0.01976642571389675,\n",
+ " 0.01324963103979826,\n",
+ " 0.030820587649941444,\n",
+ " 0.030942674726247787,\n",
+ " 0.02831321395933628,\n",
+ " 0.03134569525718689,\n",
+ " 0.016325104981660843,\n",
+ " -0.0001470379502279684,\n",
+ " -0.008936171419918537,\n",
+ " 0.004447208717465401,\n",
+ " 0.00021240688511170447,\n",
+ " -0.0014451565220952034,\n",
+ " 0.005282992031425238,\n",
+ " -0.009163286536931992,\n",
+ " -0.020548705011606216,\n",
+ " -0.014822587370872498,\n",
+ " -0.010262718424201012,\n",
+ " -0.004410305060446262,\n",
+ " 0.0005204321932978928,\n",
+ " -0.010698553174734116,\n",
+ " -0.011935777962207794,\n",
+ " -0.016313789412379265,\n",
+ " -0.016086895018815994,\n",
+ " -0.006026001181453466,\n",
+ " -0.005233586300164461,\n",
+ " -0.006422878243029118,\n",
+ " 0.0016233256319537759,\n",
+ " 0.003643572796136141,\n",
+ " -0.0001913852320285514,\n",
+ " -0.01898811198771,\n",
+ " -0.025157494470477104,\n",
+ " -0.014096292667090893,\n",
+ " -0.01694774627685547,\n",
+ " -0.018065348267555237,\n",
+ " -0.01744413562119007,\n",
+ " -0.019032346084713936,\n",
+ " -0.011644937098026276,\n",
+ " -0.01446110662072897,\n",
+ " -0.0063341292552649975,\n",
+ " 0.007109663914889097,\n",
+ " 0.0036720875650644302,\n",
+ " 0.005605868063867092,\n",
+ " -0.004630518611520529,\n",
+ " -0.011621602810919285,\n",
+ " -0.004361990373581648,\n",
+ " -0.0038554947823286057,\n",
+ " -0.0015881119761615992,\n",
+ " 0.0061269644647836685,\n",
+ " 0.013539955951273441,\n",
+ " 0.017379332333803177,\n",
+ " 0.014455473981797695,\n",
+ " 0.019328253343701363,\n",
+ " 0.01681414619088173,\n",
+ " 0.02761642262339592,\n",
+ " 0.03249058127403259,\n",
+ " 0.02243793196976185,\n",
+ " 0.025095470249652863,\n",
+ " 0.019813809543848038,\n",
+ " 0.013172836042940617,\n",
+ " 0.02501184307038784,\n",
+ " 0.02535036951303482,\n",
+ " 0.01975289173424244,\n",
+ " 0.02520027942955494,\n",
+ " 0.026372632011771202,\n",
+ " 0.025743328034877777,\n",
+ " 0.011118150316178799,\n",
+ " 0.003902260446920991,\n",
+ " 0.0039011305198073387,\n",
+ " -0.007371435407549143,\n",
+ " -0.009137284010648727,\n",
+ " 0.0016474969452247024,\n",
+ " 0.011659868992865086,\n",
+ " 0.010708037763834,\n",
+ " 0.008485903963446617,\n",
+ " 0.010129689238965511,\n",
+ " 0.005752232391387224,\n",
+ " 0.0033228867687284946,\n",
+ " -0.028027649968862534,\n",
+ " -0.04102279618382454,\n",
+ " -0.039976559579372406,\n",
+ " -0.03991375491023064,\n",
+ " -0.03151653707027435,\n",
+ " -0.04483499750494957,\n",
+ " -0.047068916261196136,\n",
+ " -0.026874028146266937,\n",
+ " -0.014819937758147717,\n",
+ " -0.007974923588335514,\n",
+ " 0.000824518094304949,\n",
+ " 0.001355901942588389,\n",
+ " 0.0062545244581997395,\n",
+ " 0.004535945598036051,\n",
+ " 0.005761114414781332,\n",
+ " 0.0035676888655871153,\n",
+ " 0.009243931621313095,\n",
+ " -0.0019145150436088443,\n",
+ " -0.012563463300466537,\n",
+ " -0.004750219639390707,\n",
+ " -0.010330742225050926,\n",
+ " -0.008525996468961239,\n",
+ " -0.005476224701851606,\n",
+ " 0.003242050064727664,\n",
+ " 0.013226129114627838,\n",
+ " 0.012910903431475163,\n",
+ " 0.00945615116506815,\n",
+ " 0.011088164523243904,\n",
+ " 0.01975233480334282,\n",
+ " 0.017904292792081833,\n",
+ " 0.021685075014829636,\n",
+ " 0.023444892838597298,\n",
+ " 0.02632923424243927,\n",
+ " 0.02718733251094818,\n",
+ " 0.0274700578302145,\n",
+ " 0.030974460765719414,\n",
+ " 0.027698388323187828,\n",
+ " 0.030338527634739876,\n",
+ " 0.01759916916489601,\n",
+ " 0.010145828127861023,\n",
+ " 0.010785859078168869,\n",
+ " 0.012820263393223286,\n",
+ " 0.001039436087012291,\n",
+ " 0.0014263009652495384,\n",
+ " 0.011243565008044243,\n",
+ " 0.00405132444575429,\n",
+ " -0.0002918285899795592,\n",
+ " 0.003985886927694082,\n",
+ " 0.0008974622469395399,\n",
+ " -0.00016717765538487583,\n",
+ " 0.004695919342339039,\n",
+ " -0.001512925955466926,\n",
+ " 0.006159887183457613,\n",
+ " 0.011171053163707256,\n",
+ " 0.0033837193623185158,\n",
+ " 0.013440846465528011,\n",
+ " 0.020161520689725876,\n",
+ " 0.005399319808930159,\n",
+ " -0.0008950530900619924,\n",
+ " 0.0009767073206603527,\n",
+ " 0.0018716963240876794,\n",
+ " -0.005152743775397539,\n",
+ " -0.008394423872232437,\n",
+ " -0.007507639471441507,\n",
+ " 0.007374136708676815,\n",
+ " 0.013064488768577576,\n",
+ " 0.01702091470360756,\n",
+ " 0.03331666812300682,\n",
+ " 0.039364565163850784,\n",
+ " 0.031202293932437897,\n",
+ " 0.0208040252327919,\n",
+ " 0.011201268061995506,\n",
+ " 0.0033627592492848635,\n",
+ " -0.0019646009895950556,\n",
+ " -0.0031524328514933586,\n",
+ " 0.0004363589396234602,\n",
+ " -0.004480340518057346,\n",
+ " -0.0004067709669470787,\n",
+ " 0.005463654175400734,\n",
+ " 0.010541819967329502,\n",
+ " 0.016026580706238747,\n",
+ " 0.017720546573400497,\n",
+ " 0.007632751949131489,\n",
+ " -0.002935093594714999,\n",
+ " -0.003704577684402466,\n",
+ " -0.004913324024528265,\n",
+ " -0.010824184864759445,\n",
+ " -0.011137007735669613,\n",
+ " -0.012465090490877628,\n",
+ " -0.015075570903718472,\n",
+ " -0.021624021232128143,\n",
+ " -0.02208191715180874,\n",
+ " -0.019536105915904045,\n",
+ " -0.01679953746497631,\n",
+ " -0.013453934341669083,\n",
+ " -0.013365051709115505,\n",
+ " -0.01675538904964924,\n",
+ " -0.018372545018792152,\n",
+ " -0.014688055031001568,\n",
+ " -0.014568314887583256,\n",
+ " -0.0126899229362607,\n",
+ " -0.012059771455824375,\n",
+ " -0.013853365555405617,\n",
+ " -0.013614390976727009,\n",
+ " -0.012666240334510803,\n",
+ " -0.013986391946673393,\n",
+ " -0.013049651868641376,\n",
+ " -0.01190341915935278,\n",
+ " -0.011362291872501373,\n",
+ " -0.010145120322704315,\n",
+ " -0.01028529368340969,\n",
+ " -0.010536414571106434,\n",
+ " -0.009143738076090813,\n",
+ " -0.009089595638215542,\n",
+ " -0.008962639607489109,\n",
+ " -0.006675417535007,\n",
+ " -0.0060259681195020676,\n",
+ " -0.006210292223840952,\n",
+ " -0.005486504174768925,\n",
+ " -0.005272102542221546,\n",
+ " -0.004794448148459196,\n",
+ " -0.00503335427492857,\n",
+ " -0.005223392974585295,\n",
+ " -0.00449112243950367,\n",
+ " -0.0045046512968838215,\n",
+ " -0.0036722649820148945,\n",
+ " -0.0028255938086658716,\n",
+ " -0.0020174665842205286,\n",
+ " -0.0008867529104463756,\n",
+ " -0.001887730322778225,\n",
+ " -0.0016902934294193983,\n",
+ " -0.0016251194756478071,\n",
+ " -0.001935891923494637,\n",
+ " -0.0016856655711308122,\n",
+ " -0.0014167025219649076,\n",
+ " -0.0005961601855233312,\n",
+ " -0.0016614252235740423,\n",
+ " -0.002028528368100524,\n",
+ " -0.0007097439374774694,\n",
+ " -0.0002931955095846206,\n",
+ " -0.0007703102310188115,\n",
+ " -0.0011331827845424414,\n",
+ " -0.0010590737219899893,\n",
+ " -0.0007797644939273596,\n",
+ " -0.0002531334466766566,\n",
+ " -0.0007386361830867827,\n",
+ " -0.0009914034744724631,\n",
+ " -0.001182180130854249,\n",
+ " -0.0009830452036112547,\n",
+ " -0.0006057446589693427,\n",
+ " -0.0011627126950770617,\n",
+ " -0.0008252001716755331,\n",
+ " 0.0006755380891263485,\n",
+ " 0.00019946102111134678,\n",
+ " 0.00022755331883672625,\n",
+ " 0.00043272849870845675,\n",
+ " -0.00024512302479706705,\n",
+ " -0.0009981408948078752,\n",
+ " -0.0004874107544310391,\n",
+ " -0.0002885085705202073,\n",
+ " -0.001031199935823679,\n",
+ " -0.000457369489595294,\n",
+ " -3.1573144951835275e-05,\n",
+ " 0.0005433136248029768,\n",
+ " 0.0006195642636157572,\n",
+ " 0.0005670224200002849,\n",
+ " 0.0008731040288694203,\n",
+ " -0.00020871804736088961,\n",
+ " 3.674410254461691e-05,\n",
+ " 0.00026626387261785567,\n",
+ " 0.0001170631148852408,\n",
+ " 9.308507287641987e-05,\n",
+ " 6.12013682257384e-05,\n",
+ " 0.00012408032489474863,\n",
+ " 0.00032900928636081517,\n",
+ " 0.0004148167499806732,\n",
+ " 0.0004404608625918627,\n",
+ " 0.0004906021640636027,\n",
+ " 0.00036237112362869084,\n",
+ " 0.0009840368293225765,\n",
+ " 0.0008120417478494346,\n",
+ " 0.00023984418658073992,\n",
+ " 0.0003541646874509752,\n",
+ " 3.661405207822099e-05,\n",
+ " 4.717326373793185e-05,\n",
+ " -0.00013178061635699123,\n",
+ " 0.0006034260732121766,\n",
+ " 0.000637341698165983,\n",
+ " 0.0002825457777362317,\n",
+ " 0.000909725611563772,\n",
+ " 0.001249623717740178,\n",
+ " 0.0008603373426012695,\n",
+ " 0.0005345637327991426,\n",
+ " 0.0008684125496074557,\n",
+ " 0.00035533448681235313,\n",
+ " 0.00015303611871786416,\n",
+ " 0.0006417471449822187,\n",
+ " 0.0005630674422718585,\n",
+ " 0.0004693359660450369,\n",
+ " 0.00045640289317816496,\n",
+ " 0.0006442577578127384,\n",
+ " 0.0007673976360820234,\n",
+ " 0.0006895225960761309,\n",
+ " 0.00039901313721202314,\n",
+ " 0.0005476705264300108,\n",
+ " 0.000606244255322963,\n",
+ " 0.0007479285704903305,\n",
+ " 0.0007109530852176249,\n",
+ " 0.00040047476068139076,\n",
+ " 0.0004297301929909736,\n",
+ " 0.0007463843794539571,\n",
+ " 0.0006467739003710449,\n",
+ " 0.0006657696794718504,\n",
+ " 0.0005741325439885259,\n",
+ " 0.0005020728567615151,\n",
+ " 0.0006728451116941869,\n",
+ " 0.0005711198900826275,\n",
+ " 0.0005149278440512717,\n",
+ " 0.0007238130201585591,\n",
+ " 0.0005309715634211898,\n",
+ " 0.00047598921810276806,\n",
+ " 0.0007293385569937527,\n",
+ " 0.0007677751127630472,\n",
+ " 0.0008045271970331669,\n",
+ " 0.0009836711687967181,\n",
+ " 0.0009469626238569617,\n",
+ " 0.0008611425873823464,\n",
+ " 0.0006562943453900516,\n",
+ " 0.0005742606008425355,\n",
+ " 0.0004597051884047687,\n",
+ " 0.0007511923904530704,\n",
+ " 0.00018865351739805192,\n",
+ " 0.0004445254453457892,\n",
+ " 0.0003657930647023022,\n",
+ " 0.0002196271816501394,\n",
+ " 0.00017099893011618406,\n",
+ " 0.0003212476149201393,\n",
+ " ...],\n",
+ " 'input_length': 67392,\n",
+ " 'labels': [16,\n",
+ " 27,\n",
+ " 22,\n",
+ " 0,\n",
+ " 7,\n",
+ " 16,\n",
+ " 0,\n",
+ " 15,\n",
+ " 11,\n",
+ " 21,\n",
+ " 21,\n",
+ " 29,\n",
+ " 29,\n",
+ " 16,\n",
+ " 0,\n",
+ " 22,\n",
+ " 3,\n",
+ " 18,\n",
+ " 3,\n",
+ " 23,\n",
+ " 13,\n",
+ " 21,\n",
+ " 7,\n",
+ " 21,\n",
+ " 21,\n",
+ " 3,\n",
+ " 0,\n",
+ " 21,\n",
+ " 11,\n",
+ " 16,\n",
+ " 23,\n",
+ " 3,\n",
+ " 0,\n",
+ " 3,\n",
+ " 23,\n",
+ " 22,\n",
+ " 3]}"
+ ]
+ },
+ "execution_count": 16,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "#common_voice_test_audio[0]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 17,
+ "id": "9124b4b0",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "outputs": [],
+ "source": [
+    "def evaluate(batch):\n",
+    "    \"\"\"Transcribe a batch by taking the argmax over the last logits dimension.\n",
+    "\n",
+    "    Reads ``batch[\"input_values\"]``, runs the notebook-level ``model`` on the\n",
+    "    \"cuda\" device and stores the decoded strings under ``batch[\"pred_strings\"]``.\n",
+    "    Returns the same ``batch`` object.\n",
+    "    \"\"\"\n",
+    "    features = processor(\n",
+    "        batch[\"input_values\"],\n",
+    "        sampling_rate=16_000,\n",
+    "        return_tensors=\"pt\",\n",
+    "        padding=True,\n",
+    "    )\n",
+    "    input_values = features.input_values.to(\"cuda\")\n",
+    "    attention_mask = features.attention_mask.to(\"cuda\")\n",
+    "\n",
+    "    # Inference only, so gradient tracking is switched off for the forward pass.\n",
+    "    with torch.no_grad():\n",
+    "        logits = model(input_values, attention_mask=attention_mask).logits\n",
+    "\n",
+    "    best_token_ids = torch.argmax(logits, dim=-1)\n",
+    "    batch[\"pred_strings\"] = processor.batch_decode(best_token_ids)\n",
+    "    return batch\n",
+ "\n",
+    "def evaluate_with_lm(batch):\n",
+    "    \"\"\"Transcribe a batch by handing the raw logits to ``processor.batch_decode``.\n",
+    "\n",
+    "    No argmax is taken here: the logits are moved to the CPU, converted to a\n",
+    "    NumPy array, and the ``.text`` field of the decoder output is stored under\n",
+    "    ``batch[\"pred_strings\"]``. Returns the same ``batch`` object.\n",
+    "\n",
+    "    NOTE(review): presumably ``processor`` is the language-model-backed\n",
+    "    processor at this point -- confirm where ``processor`` is created.\n",
+    "    \"\"\"\n",
+    "    features = processor(\n",
+    "        batch[\"input_values\"],\n",
+    "        sampling_rate=16_000,\n",
+    "        return_tensors=\"pt\",\n",
+    "        padding=True,\n",
+    "    )\n",
+    "\n",
+    "    # Inference only, so gradient tracking is switched off for the forward pass.\n",
+    "    with torch.no_grad():\n",
+    "        outputs = model(\n",
+    "            features.input_values.to(\"cuda\"),\n",
+    "            attention_mask=features.attention_mask.to(\"cuda\"),\n",
+    "        )\n",
+    "\n",
+    "    logits_np = outputs.logits.cpu().numpy()\n",
+    "    batch[\"pred_strings\"] = processor.batch_decode(logits_np).text\n",
+    "    return batch\n",
+ "\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 18,
+ "id": "039e8a8e",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "outputs": [],
+ "source": [
+    "# Metric object used below to score predictions against reference sentences (reported as \"WER\").\n",
+    "wer_metric = load_metric(\"wer\")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 19,
+ "id": "94acd542",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "outputs": [
+ {
+ "data": {
+ "application/vnd.jupyter.widget-view+json": {
+ "model_id": "b49d6621f4d64d1d94aeba87e7718eb5",
+ "version_major": 2,
+ "version_minor": 0
+ },
+ "text/plain": [
+ " 0%| | 0/200 [00:00, ?ba/s]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+    "# Optional smoke test on the first 100 examples with argmax decoding (disabled):\n",
+    "#sample_1 = common_voice_test_audio.select([i for i in range(100)])\n",
+    "#result = sample_1.map(evaluate, batched=True, batch_size=8)\n",
+    "# Decode all of common_voice_test_audio, 8 examples per call to evaluate_with_lm.\n",
+    "result_with_lm = common_voice_test_audio.map(evaluate_with_lm, batched=True, batch_size=8)\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 20,
+ "id": "1dea4e88",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "1. result\n",
+ "pred: nyt en missään tapauksessa sinua auttaa\n",
+ "sentence: nyt en missään tapauksessa sinua auta\n",
+ "#################\n",
+ "2. result\n",
+ "pred: emme tarvitsisi äänestä toista vihonnista\n",
+ "sentence: emme tarvitsisi hänestä toista vihollista\n",
+ "#################\n",
+ "3. result\n",
+ "pred: matti vanha sen isä oli dosentti tatuvanhanen ja äiti rouva annitiihanen\n",
+ "sentence: matti vanhasen isä oli dosentti tatu vanhanen ja äiti rouva anni tiihonen\n",
+ "#################\n",
+ "4. result\n",
+ "pred: äänestin henkilökohtaisesti näiden tarkistusten puolesta\n",
+ "sentence: äänestin henkilökohtaisesti näiden tarkistusten puolesta\n",
+ "#################\n",
+ "5. result\n",
+ "pred: tunsin oloni loistavaksi kun olin saanut pojan paremmalle tuudelle\n",
+ "sentence: tunsin oloni loistavaksi kun olin saanut pojan paremmalle tuulelle\n",
+ "#################\n",
+ "6. result\n",
+ "pred: ankeriaskantojen elvyttämiseksi on päätetty vähentää ankeriaankalastusta puoleen\n",
+ "sentence: ankeriaskantojen elvyttämiseksi on päätetty vähentää ankeriaankalastusta puoleen\n",
+ "#################\n",
+ "7. result\n",
+ "pred: tämän planeetan olemassaolo saattoi hyvinkin olla hallituksen tiedossa toisin kuin hydruksen olemassaolo\n",
+ "sentence: tämän planeetan olemassaolo saattoi hyvinkin olla hallituksen tiedossa toisin kuin hydruksen olemassaolo\n",
+ "#################\n",
+ "8. result\n",
+ "pred: eikä ilmassakaan havaittu haitallisia kaasuja tai bakteereita\n",
+ "sentence: eikä ilmassakaan havaittu haitallisia kaasuja tai bakteereita\n",
+ "#################\n",
+ "9. result\n",
+ "pred: missäköhän kaikki vaatteeni ovat\n",
+ "sentence: missäköhän kaikki vaatteeni ovat\n",
+ "#################\n",
+ "10. result\n",
+ "pred: tavasta oli suu suru\n",
+ "sentence: talossa oli suuri suru\n",
+ "#################\n"
+ ]
+ }
+ ],
+ "source": [
+    "# Eyeball the first ten predictions next to their reference sentences.\n",
+    "\n",
+    "for row_number in range(1, 11):\n",
+    "    row = result_with_lm[row_number - 1]\n",
+    "    print(str(row_number) + \". result\")\n",
+    "    print(\"pred: \" + str(row[\"pred_strings\"]))\n",
+    "    print(\"sentence: \" + str(row[\"sentence\"]))\n",
+    "    print(\"#################\")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 23,
+ "id": "34ecefd3",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "WER: 10.813813\n"
+ ]
+ }
+ ],
+ "source": [
+    "# Word error rate of the LM-decoded predictions, as a percentage.\n",
+    "# \"{:.2f}\" rounds to two decimals; the former \"{:2f}\" only set a minimum field\n",
+    "# width of 2 and therefore printed six decimals.\n",
+    "print(\n",
+    "    \"WER: {:.2f}\".format(\n",
+    "        100 * wer_metric.compute(predictions=result_with_lm[\"pred_strings\"], references=result_with_lm[\"sentence\"])\n",
+    "    )\n",
+    ")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "3c927fd5",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "source": [
+    "## Test on Mozilla Common Voice 7.0 loaded directly from the Hub\n",
+ "Using currently the \"old\" preprocessing and not the \"audio\" method
\", \"…\", \"–\", \"°\", \"´\", \"ʾ\", \"‹\", \"›\", \"©\", \"®\", \"—\", \"→\", \"。\",\n",
+ " \"、\", \"﹂\", \"﹁\", \"‧\", \"~\", \"﹏\", \",\", \"{\", \"}\", \"(\", \")\", \"[\", \"]\", \"【\", \"】\", \"‥\", \"〽\",\n",
+ " \"『\", \"』\", \"〝\", \"〟\", \"⟨\", \"⟩\", \"〜\", \":\", \"!\", \"?\", \"♪\", \"؛\", \"/\", \"\\\\\", \"º\", \"−\", \"^\", \"ʻ\", \"ˆ\"]\n",
+ "\n",
+ "\n",
+    "# One character class matching any single ignored character. re.escape keeps the\n",
+    "# regex metacharacters present in the list (brackets, backslash, caret) literal.\n",
+    "chars_to_remove_regex = f\"[{re.escape(''.join(CHARS_TO_IGNORE))}]\"\n",
+ "\n",
+    "def remove_special_characters(batch):\n",
+    "    \"\"\"Delete every match of ``chars_to_remove_regex`` from the sentence, then lowercase it.\n",
+    "\n",
+    "    Overwrites ``batch[\"sentence\"]`` in place and returns the same ``batch``.\n",
+    "    \"\"\"\n",
+    "    stripped = re.sub(chars_to_remove_regex, '', batch[\"sentence\"])\n",
+    "    batch[\"sentence\"] = stripped.lower()\n",
+    "    return batch\n",
+ "\n",
+    "# Apply the cleanup to each example. The name is rebound to the mapped dataset,\n",
+    "# so re-running this cell operates on already-cleaned sentences.\n",
+    "common_voice_dataset = common_voice_dataset.map(remove_special_characters)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 27,
+ "id": "396369b6",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "Loading cached processed dataset at /workspace/.cache/huggingface/datasets/mozilla-foundation___common_voice/fi/7.0.0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba/cache-b66d07bf277a5504.arrow\n"
+ ]
+ }
+ ],
+ "source": [
+    "def resample_audios(batch):\n",
+    "    \"\"\"Replace the example's waveform with the output of ``F.resample(..., 16_000)``.\n",
+    "\n",
+    "    The source rate is read from ``batch[\"audio\"][\"sampling_rate\"]``; the result is\n",
+    "    written back to ``batch[\"audio\"][\"array\"]`` as a NumPy array.\n",
+    "\n",
+    "    NOTE(review): ``batch[\"audio\"][\"sampling_rate\"]`` is not updated here, so it\n",
+    "    still holds the original rate afterwards -- confirm nothing downstream reads it.\n",
+    "    \"\"\"\n",
+    "    source_rate = batch[\"audio\"][\"sampling_rate\"]\n",
+    "    waveform = torch.tensor(batch[\"audio\"][\"array\"])\n",
+    "    batch[\"audio\"][\"array\"] = F.resample(waveform, source_rate, 16_000).numpy()\n",
+    "    return batch\n",
+ "\n",
+    "# Resample every example; the name is rebound to the mapped dataset.\n",
+    "common_voice_dataset = common_voice_dataset.map(resample_audios)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 28,
+ "id": "2852ca1c",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+    "def prepare_dataset(batch):\n",
+    "    \"\"\"Add model inputs and label ids to a single example.\n",
+    "\n",
+    "    Keys written:\n",
+    "      * ``input_values``: first entry of the processor output for the waveform\n",
+    "        (the processor is told the audio is sampled at 16000 Hz)\n",
+    "      * ``input_length``: ``len()`` of those input values\n",
+    "      * ``labels``: ``input_ids`` the processor returns for ``batch[\"sentence\"]``\n",
+    "\n",
+    "    ``batch[\"sentence\"]`` is read but left unchanged. Returns the same ``batch``.\n",
+    "    \"\"\"\n",
+    "    batch[\"input_values\"] = processor(batch[\"audio\"][\"array\"], sampling_rate=16000).input_values[0]\n",
+    "    batch[\"input_length\"] = len(batch[\"input_values\"])\n",
+    "\n",
+    "    # Labels are produced while the processor is in its target mode\n",
+    "    # (see the Wav2Vec2 processor documentation for as_target_processor).\n",
+    "    with processor.as_target_processor():\n",
+    "        batch[\"labels\"] = processor(batch[\"sentence\"]).input_ids\n",
+    "    return batch"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 29,
+ "id": "7832bd68",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "application/vnd.jupyter.widget-view+json": {
+ "model_id": "58ff04eeda134bec9ffdc7bcf71fc66c",
+ "version_major": 2,
+ "version_minor": 0
+ },
+ "text/plain": [
+ " 0%| | 0/1599 [00:00, ?ex/s]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+    "# Add input_values / input_length / labels to every example (one example per call).\n",
+    "common_voice_dataset = common_voice_dataset.map(prepare_dataset)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 30,
+ "id": "75ab8e07",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+    "# Same metric as loaded in an earlier cell of this notebook; loaded again for this section.\n",
+    "wer_metric = load_metric(\"wer\")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 31,
+ "id": "7c52f988",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+    "def evaluate_with_lm(batch):\n",
+    "    \"\"\"Transcribe a batch by handing the raw logits to ``processor.batch_decode``.\n",
+    "\n",
+    "    The logits are moved to the CPU, converted to a NumPy array, and the\n",
+    "    ``.text`` field of the decoder output is stored under\n",
+    "    ``batch[\"pred_strings\"]``. Returns the same ``batch`` object.\n",
+    "\n",
+    "    NOTE(review): a function with this name and the same behaviour is already\n",
+    "    defined earlier in this notebook; this definition shadows it.\n",
+    "    \"\"\"\n",
+    "    features = processor(\n",
+    "        batch[\"input_values\"],\n",
+    "        sampling_rate=16_000,\n",
+    "        return_tensors=\"pt\",\n",
+    "        padding=True,\n",
+    "    )\n",
+    "\n",
+    "    # Inference only, so gradient tracking is switched off for the forward pass.\n",
+    "    with torch.no_grad():\n",
+    "        outputs = model(\n",
+    "            features.input_values.to(\"cuda\"),\n",
+    "            attention_mask=features.attention_mask.to(\"cuda\"),\n",
+    "        )\n",
+    "\n",
+    "    logits_np = outputs.logits.cpu().numpy()\n",
+    "    batch[\"pred_strings\"] = processor.batch_decode(logits_np).text\n",
+    "    return batch"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 32,
+ "id": "95ae82dd",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "application/vnd.jupyter.widget-view+json": {
+ "model_id": "8c43b96d24ec4942a33e4f8d4e66f8c6",
+ "version_major": 2,
+ "version_minor": 0
+ },
+ "text/plain": [
+ " 0%| | 0/200 [00:00, ?ba/s]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "WER: 13.489499\n"
+ ]
+ }
+ ],
+ "source": [
+    "# Decode the prepared dataset, 8 examples per call to evaluate_with_lm.\n",
+    "result_with_lm = common_voice_dataset.map(evaluate_with_lm, batched=True, batch_size=8)\n",
+    "# \"{:.2f}\" rounds to two decimals; the former \"{:2f}\" only set a minimum field\n",
+    "# width of 2 and therefore printed six decimals.\n",
+    "print(\n",
+    "    \"WER: {:.2f}\".format(\n",
+    "        100 * wer_metric.compute(predictions=result_with_lm[\"pred_strings\"], references=result_with_lm[\"sentence\"])\n",
+    "    )\n",
+    ")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "668dc828",
+ "metadata": {},
+ "source": [
+ "\n",
+    "## ASR pipeline predictions (same kind as in eval.py)\n",
+ "\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 49,
+ "id": "5302f579",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "Using the latest cached version of the module from /workspace/.cache/huggingface/modules/datasets_modules/datasets/mozilla-foundation--common_voice_7_0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba (last modified on Sun Jan 23 16:17:44 2022) since it couldn't be found locally at mozilla-foundation/common_voice_7_0., or remotely on the Hugging Face Hub.\n",
+ "Reusing dataset common_voice (/workspace/.cache/huggingface/datasets/mozilla-foundation___common_voice/fi/7.0.0/33e08856cfa0d0665e837bcad73ffd920a0bc713ce8c5fffb55dbdf1c084d5ba)\n"
+ ]
+ }
+ ],
+ "source": [
+    "# Reload the \"fi\" test split so this section does not reuse the dataset that the\n",
+    "# earlier cells already cleaned, resampled and extended with model inputs.\n",
+    "common_voice_dataset = load_dataset(\"mozilla-foundation/common_voice_7_0\", \"fi\", split=\"test\")\n",
+    "\n",
+    "# Declare the audio column as 16_000 Hz. Per the datasets Audio feature docs the\n",
+    "# resampling then happens when an example's audio is decoded -- TODO confirm for\n",
+    "# the installed datasets version.\n",
+    "common_voice_dataset = common_voice_dataset.cast_column(\"audio\", Audio(sampling_rate=16_000))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 54,
+ "id": "6c048f8b",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+    "# Characters deleted from reference transcripts before scoring. Kept as a list of\n",
+    "# literals; duplicates are harmless because they end up in one character class.\n",
+    "_NORMALIZE_CHARS_TO_IGNORE = [\",\", \"?\", \"¿\", \".\", \"!\", \"¡\", \";\", \";\", \":\", '\"\"', \"%\", '\"', \"�\", \"ʿ\", \"·\", \"჻\", \"~\", \"՞\",\n",
+    "                      \"؟\", \"،\", \"।\", \"॥\", \"«\", \"»\", \"„\", \"“\", \"”\", \"「\", \"」\", \"‘\", \"’\", \"《\", \"》\", \"(\", \")\", \"[\", \"]\",\n",
+    "                      \"{\", \"}\", \"=\", \"`\", \"_\", \"+\", \"<\", \">\", \"…\", \"–\", \"°\", \"´\", \"ʾ\", \"‹\", \"›\", \"©\", \"®\", \"—\", \"→\", \"。\",\n",
+    "                      \"、\", \"﹂\", \"﹁\", \"‧\", \"~\", \"﹏\", \",\", \"{\", \"}\", \"(\", \")\", \"[\", \"]\", \"【\", \"】\", \"‥\", \"〽\",\n",
+    "                  \"『\", \"』\", \"〝\", \"〟\", \"⟨\", \"⟩\", \"〜\", \":\", \"!\", \"?\", \"♪\", \"؛\", \"/\", \"\\\\\", \"º\", \"−\", \"^\", \"ʻ\", \"ˆ\"]\n",
+    "\n",
+    "# Built and compiled once instead of on every call. re.escape keeps the regex\n",
+    "# metacharacters in the list (brackets, backslash, caret) literal.\n",
+    "_NORMALIZE_CHARS_PATTERN = re.compile(f\"[{re.escape(''.join(_NORMALIZE_CHARS_TO_IGNORE))}]\")\n",
+    "\n",
+    "\n",
+    "def normalize_text(text: str) -> str:\n",
+    "    \"\"\"Normalize a target transcript: delete ignored characters, then lowercase.\n",
+    "\n",
+    "    Args:\n",
+    "        text: the reference sentence.\n",
+    "\n",
+    "    Returns:\n",
+    "        ``text`` without any character listed in ``_NORMALIZE_CHARS_TO_IGNORE``,\n",
+    "        lowercased. Whitespace is left untouched (runs of spaces are not collapsed).\n",
+    "    \"\"\"\n",
+    "    return _NORMALIZE_CHARS_PATTERN.sub('', text).lower()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 55,
+ "id": "9fa432f2",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+    "# map function to decode audio\n",
+    "def map_to_pred(batch):\n",
+    "    \"\"\"Transcribe one example with the ``asr`` pipeline and normalize its reference.\n",
+    "\n",
+    "    Writes the pipeline's ``\"text\"`` result to ``batch[\"prediction\"]`` and\n",
+    "    ``normalize_text(batch[\"sentence\"])`` to ``batch[\"target\"]``; returns ``batch``.\n",
+    "    \"\"\"\n",
+    "    waveform = batch[\"audio\"][\"array\"]\n",
+    "    batch[\"prediction\"] = asr(waveform)[\"text\"]\n",
+    "    batch[\"target\"] = normalize_text(batch[\"sentence\"])\n",
+    "    return batch"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 56,
+ "id": "d80cf431",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "outputs": [
+ {
+ "data": {
+ "application/vnd.jupyter.widget-view+json": {
+ "model_id": "4dc38b78128f49938ec47a41be469153",
+ "version_major": 2,
+ "version_minor": 0
+ },
+ "text/plain": [
+ " 0%| | 0/1599 [00:00, ?ex/s]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "/opt/conda/lib/python3.8/site-packages/transformers/pipelines/base.py:976: UserWarning: You seem to be using the pipelines sequentially on GPU. In order to maximize efficiency please use a dataset\n",
+ " warnings.warn(\n"
+ ]
+ }
+ ],
+ "source": [
+    "# Checkpoint id passed to the pipeline.\n",
+    "model_id = \"RASMUS/wav2vec2-xlsr-fi-lm-1B\"\n",
+    "\n",
+    "# device=0 selects device index 0 (the recorded run warns about sequential GPU use).\n",
+    "asr = pipeline(\"automatic-speech-recognition\", model=model_id, device=0)\n",
+    "# Run inference on all examples, one example per call. remove_columns drops the\n",
+    "# original columns, leaving the keys map_to_pred adds (\"prediction\", \"target\").\n",
+    "result = common_voice_dataset.map(map_to_pred, remove_columns=common_voice_dataset.column_names)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 57,
+ "id": "0486bb61",
+ "metadata": {
+ "papermill": {
+ "duration": null,
+ "end_time": null,
+ "exception": null,
+ "start_time": null,
+ "status": "pending"
+ },
+ "tags": []
+ },
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "WER: 27.110258\n"
+ ]
+ }
+ ],
+ "source": [
+    "# Word error rate of the pipeline predictions against the normalized targets,\n",
+    "# as a percentage. \"{:.2f}\" rounds to two decimals; the former \"{:2f}\" only set\n",
+    "# a minimum field width of 2 and therefore printed six decimals.\n",
+    "print(\n",
+    "    \"WER: {:.2f}\".format(\n",
+    "        100 * wer_metric.compute(predictions=result[\"prediction\"], references=result[\"target\"])\n",
+    "    )\n",
+    ")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "id": "6cdf2c33",
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.8.8"
+ },
+ "papermill": {
+ "default_parameters": {},
+ "duration": null,
+ "end_time": null,
+ "environment_variables": {},
+ "exception": null,
+ "input_path": "__notebook__.ipynb",
+ "output_path": "__notebook__.ipynb",
+ "parameters": {},
+ "start_time": "2022-01-04T20:58:19.515266",
+ "version": "2.3.3"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}