{ "cells": [ { "cell_type": "code", "execution_count": 11, "metadata": {}, "outputs": [], "source": [ "import os\n", "import json\n", "from pyspark.sql import SparkSession\n", "import pandas as pd\n", "import polars as pl\n", "from tqdm.auto import tqdm, trange\n", "from concurrent.futures import ThreadPoolExecutor, as_completed\n", "import matplotlib.pyplot as plt\n", "\n", "import torch\n", "import torchvision as tv\n", "from torchvision.transforms import v2\n", "\n", "SCRATCH = r\"/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani\"\n", "DATADIR = r\"/home/IITB/ai-at-ieor/23m1521/datasets/Vaani\"\n", "JSON_PATH = os.path.join(DATADIR, \"Vaani_IIsc_Artpark_Full_Data.json\")\n", "IMAGES_PATH = os.path.join(SCRATCH, \"Images\")\n", "IMAGES_PARQUETS = os.path.join(SCRATCH, \"images_parquets\")\n", "AUDIO_URLS = \"audio_urls.txt\"\n", "IMAGES_URLS = \"images_urls.txt\"\n", "IMAGE_ROOT_URL = 'https://vaani.iisc.ac.in/'\n", "METADATA_PATH = r\"/home/IITB/ai-at-ieor/23m1521/ashish/MTP/Vaani/Vaani-Images-Audio-MetaData.parquet\"" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Files found: 128807\n" ] } ], "source": [ "def walkDIR(folder_path, include=None):\n", " file_list = []\n", " for root, _, files in os.walk(folder_path):\n", " for file in files:\n", " if include is None or any(file.endswith(ext) for ext in include):\n", " file_list.append(os.path.join(root, file))\n", " print(\"Files found:\", len(file_list))\n", " return file_list\n", "\n", "files = walkDIR(IMAGES_PATH, include=['.png', '.jpeg', '.jpg'])" ] }, { "cell_type": "code", "execution_count": 8, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "['/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani/Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg',\n", " '/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani/Images/IISc_VaaniProject_TehriGarhwal-SPECIFIC_00863.jpg',\n", " '/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani/Images/IISc_VaaniProject_Budaun-SPECIFIC_00129.jpg',\n", " '/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani/Images/IISc_VaaniProject_Jashpur-SPECIFIC_00102.jpg',\n", " '/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani/Images/IISc_VaaniProject_Saharsa-SPECIFIC_00905.jpg',\n", " '/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani/Images/IISc_VaaniProject_Purulia-SPECIFIC_00971.jpg',\n", " '/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani/Images/IISc_VaaniProject_Samastipur-SPECIFIC_00274.jpg',\n", " '/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani/Images/IISc_VaaniProject_PaschimMedinipur-SPECIFIC_00501.jpg',\n", " '/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani/Images/IISc_VaaniProject_Sahebganj-SPECIFIC_00315.jpg',\n", " '/scratch/IITB/ai-at-ieor/23m1521/datasets/Vaani/Images/IISc_VaaniProject_Sarguja-SPECIFIC_00485.jpg']" ] }, "execution_count": 8, "metadata": {}, "output_type": "execute_result" } ], "source": [ "files[:10]" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "class MnistDataset(torch.utils.data.Dataset):\n", " def __init__(\n", " self,\n", " data,\n", " im_size\n", " ):\n", " if isinstance(data, str):\n", " self.data = pd.read_csv(data)\n", " elif isinstance(data, pd.DataFrame):\n", " self.data = data\n", " else:\n", " raise ValueError(\"The `data` argument must be a string (CSV file path) or a Pandas DataFrame.\")\n", " \n", " self.im_size = im_size\n", "\n", " def __len__(self):\n", " return len(self.data)\n", "\n", " def __getitem__(self, idx):\n", " row = self.data.iloc[idx]\n", " image_path = row['image_path']\n", " label = int(row['label'])\n", "\n", " image = tv.io.decode_image(image_path, mode='RGB')\n", " image = v2.Resize(self.im_size)(image)\n", " image = v2.ToDtype(torch.float32, scale=True)(image)\n", " image = 2*image - 1\n", "\n", " return image, label" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "df = pd.read_parquet(METADATA_PATH)" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "data": { "application/vnd.microsoft.datawrangler.viewer.v0+json": { "columns": [ { "name": "index", "rawType": "int64", "type": "integer" }, { "name": "image_name", "rawType": "object", "type": "string" }, { "name": "state", "rawType": "object", "type": "string" }, { "name": "district", "rawType": "object", "type": "string" }, { "name": "gender", "rawType": "object", "type": "string" }, { "name": "audio_language", "rawType": "object", "type": "string" }, { "name": "audio_name", "rawType": "object", "type": "string" } ], "conversionMethod": "pd.DataFrame", "ref": "5cf67481-51db-4753-9850-4b244b697322", "rows": [ [ "0", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00559.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885658_MRACO_32387_0_10237.wav" ], [ "1", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00404.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885688_MRACH_323525_10676_14796.wav" ], [ "2", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00365.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885773_MRACS_92011_0_13216.wav" ], [ "3", "Images/IISc_VaaniProject_GENERIC_0073.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885423_MRABC_323380_11266_20399.wav" ], [ "4", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_01252.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10886492_MRACH_80994_515_9950.wav" ], [ "5", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00369.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885712_MRACLT_323569_13981_21501.wav" ], [ "6", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00404.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885688_MRACH_323525_0_5754.wav" ], [ "7", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00137.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885641_MRACLT_323571_12610_21310.wav" ], [ "8", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_01082.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885477_MRACH_323524_12546_20926.wav" ], [ "9", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_01272.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885675_MRACH_80188_9499_19963.wav" ], [ "10", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_01244.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885904_MRACLT_323572_818_11691.wav" ], [ "11", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00137.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885641_MRACLT_323571_498_12290.wav" ], [ "12", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_01082.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885477_MRACH_323524_1655_12345.wav" ], [ "13", "Images/IISc_VaaniProject_GENERIC_0073.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885423_MRABC_323380_200_11206.wav" ], [ "14", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00034.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10886672_MRADM_236186_498_9130.wav" ], [ "15", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00404.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885688_MRACH_323525_6190_10263.wav" ], [ "16", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00365.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885773_MRACS_92011_13230_20402.wav" ], [ "17", "Images/IISc_VaaniProject_GENERIC_0179.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10881852_KTCMMAO_300177_498_15241.wav" ], [ "18", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00034.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10886672_MRADM_236186_9170_20846.wav" ], [ "19", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00997.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885503_MRACH_323530_0_4589.wav" ], [ "20", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00559.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885658_MRACO_32387_10473_19952.wav" ], [ "21", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00997.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885503_MRACH_323530_4816_19125.wav" ], [ "22", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_01244.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885904_MRACLT_323572_12033_19988.wav" ], [ "23", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_01252.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10886492_MRACH_80994_9950_20461.wav" ], [ "24", "Images/IISc_VaaniProject_GENERIC_0179.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10881852_KTCMMAO_300177_15841_20461.wav" ], [ "25", "Images/IISc_VaaniProject_GENERIC_1041.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11157562_UPVNFR_142622_13_10446.wav" ], [ "26", "Images/IISc_VaaniProject_GENERIC_1037.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11160952_UPVNTA_123296_0_12723.wav" ], [ "27", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00369.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885712_MRACLT_323569_498_13741.wav" ], [ "28", "Images/IISc_VaaniProject_GENERIC_0980.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11160070_UPVNHT_161133_2_11717.wav" ], [ "29", "Images/IISc_VaaniProject_Aurangabad-SPECIFIC_00404.jpg", "Maharashtra", "Aurangabad", "female", "Marathi", "Audios/Aurangabad/IISc_VaaniProject_S_Maharashtra_Aurangabad_95220_10885688_MRACH_323525_15090_20194.wav" ], [ "30", "Images/IISc_VaaniProject_GENERIC_0857.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11157614_TGNLFLM_14947_11483_17575.wav" ], [ "31", "Images/IISc_VaaniProject_GENERIC_0784.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11161711_UPVNREI_136144_0_11475.wav" ], [ "32", "Images/IISc_VaaniProject_GENERIC_0991.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11159902_UPVNML_191445_0_10486.wav" ], [ "33", "Images/IISc_VaaniProject_GENERIC_1037.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11160952_UPVNTA_123296_12723_14915.wav" ], [ "34", "Images/IISc_VaaniProject_GENERIC_1004.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11159231_UPVNHC_147120_0_9681.wav" ], [ "35", "Images/IISc_VaaniProject_GENERIC_0798.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11158013_UPVNFN_199962_0_12217.wav" ], [ "36", "Images/IISc_VaaniProject_GENERIC_1061.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11159169_TGNLSL_79868_2_11538.wav" ], [ "37", "Images/IISc_VaaniProject_GENERIC_0902.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11158905_UPVNIM_17694_0_9213.wav" ], [ "38", "Images/IISc_VaaniProject_GENERIC_1028.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11158685_UPVNEX_152314_0_11230.wav" ], [ "39", "Images/IISc_VaaniProject_GENERIC_0850.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11157526_UPVNHO_17386_0_10631.wav" ], [ "40", "Images/IISc_VaaniProject_GENERIC_0723.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11160293_UPVNLK_136180_0_10991.wav" ], [ "41", "Images/IISc_VaaniProject_GENERIC_0857.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11157614_TGNLFLM_14947_565_11483.wav" ], [ "42", "Images/IISc_VaaniProject_GENERIC_1033.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11160176_UPVNGOB_3297_107_14754.wav" ], [ "43", "Images/IISc_VaaniProject_GENERIC_0824.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11160850_UPVNRI_11356_0_11078.wav" ], [ "44", "Images/IISc_VaaniProject_GENERIC_0830.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11158620_TGNLST_11812_0_9545.wav" ], [ "45", "Images/IISc_VaaniProject_GENERIC_0923.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11160686_UPVNMO_145096_0_12159.wav" ], [ "46", "Images/IISc_VaaniProject_GENERIC_0797.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11160624_UPVNSU_55591_2_10857.wav" ], [ "47", "Images/IISc_VaaniProject_Solapur-SPECIFIC_00231.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_72631_9964768_MRSREI_271382_0_12602.wav" ], [ "48", "Images/IISc_VaaniProject_GENERIC_0991.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_102552_11159902_UPVNML_191445_10486_13559.wav" ], [ "49", "Images/IISc_VaaniProject_Solapur-SPECIFIC_01764.jpg", "Maharashtra", "Solapur", "female", "Marathi", "Audios/Solapur/IISc_VaaniProject_S_Maharashtra_Solapur_72631_9962743_MRSOTHER_274077_5208_16951.wav" ] ], "shape": { "columns": 6, "rows": 9584932 } }, "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
image_namestatedistrictgenderaudio_languageaudio_name
0Images/IISc_VaaniProject_Aurangabad-SPECIFIC_0...MaharashtraAurangabadfemaleMarathiAudios/Aurangabad/IISc_VaaniProject_S_Maharash...
1Images/IISc_VaaniProject_Aurangabad-SPECIFIC_0...MaharashtraAurangabadfemaleMarathiAudios/Aurangabad/IISc_VaaniProject_S_Maharash...
2Images/IISc_VaaniProject_Aurangabad-SPECIFIC_0...MaharashtraAurangabadfemaleMarathiAudios/Aurangabad/IISc_VaaniProject_S_Maharash...
3Images/IISc_VaaniProject_GENERIC_0073.jpgMaharashtraAurangabadfemaleMarathiAudios/Aurangabad/IISc_VaaniProject_S_Maharash...
4Images/IISc_VaaniProject_Aurangabad-SPECIFIC_0...MaharashtraAurangabadfemaleMarathiAudios/Aurangabad/IISc_VaaniProject_S_Maharash...
.....................
9584927Images/IISc_VaaniProject_GENERIC_0554.jpgKarnatakaChamarajanagarfemaleKannadaAudios/Chamrajn/IISc_VaaniProject_M_KA_Chamraj...
9584928Images/IISc_VaaniProject_Chamrajnagar-SPECIFIC...KarnatakaChamarajanagarfemaleKannadaAudios/Chamrajn/IISc_VaaniProject_M_KA_Chamraj...
9584929Images/IISc_VaaniProject_Chamrajnagar-SPECIFIC...KarnatakaChamarajanagarfemaleKannadaAudios/Chamrajn/IISc_VaaniProject_M_KA_Chamraj...
9584930Images/IISc_VaaniProject_Chamrajnagar-SPECIFIC...KarnatakaChamarajanagarfemaleKannadaAudios/Chamrajn/IISc_VaaniProject_M_KA_Chamraj...
9584931Images/IISc_VaaniProject_Chamrajnagar-SPECIFIC...KarnatakaChamarajanagarfemaleKannadaAudios/Chamrajn/IISc_VaaniProject_M_KA_Chamraj...
\n", "

9584932 rows × 6 columns

\n", "
" ], "text/plain": [ " image_name state \\\n", "0 Images/IISc_VaaniProject_Aurangabad-SPECIFIC_0... Maharashtra \n", "1 Images/IISc_VaaniProject_Aurangabad-SPECIFIC_0... Maharashtra \n", "2 Images/IISc_VaaniProject_Aurangabad-SPECIFIC_0... Maharashtra \n", "3 Images/IISc_VaaniProject_GENERIC_0073.jpg Maharashtra \n", "4 Images/IISc_VaaniProject_Aurangabad-SPECIFIC_0... Maharashtra \n", "... ... ... \n", "9584927 Images/IISc_VaaniProject_GENERIC_0554.jpg Karnataka \n", "9584928 Images/IISc_VaaniProject_Chamrajnagar-SPECIFIC... Karnataka \n", "9584929 Images/IISc_VaaniProject_Chamrajnagar-SPECIFIC... Karnataka \n", "9584930 Images/IISc_VaaniProject_Chamrajnagar-SPECIFIC... Karnataka \n", "9584931 Images/IISc_VaaniProject_Chamrajnagar-SPECIFIC... Karnataka \n", "\n", " district gender audio_language \\\n", "0 Aurangabad female Marathi \n", "1 Aurangabad female Marathi \n", "2 Aurangabad female Marathi \n", "3 Aurangabad female Marathi \n", "4 Aurangabad female Marathi \n", "... ... ... ... \n", "9584927 Chamarajanagar female Kannada \n", "9584928 Chamarajanagar female Kannada \n", "9584929 Chamarajanagar female Kannada \n", "9584930 Chamarajanagar female Kannada \n", "9584931 Chamarajanagar female Kannada \n", "\n", " audio_name \n", "0 Audios/Aurangabad/IISc_VaaniProject_S_Maharash... \n", "1 Audios/Aurangabad/IISc_VaaniProject_S_Maharash... \n", "2 Audios/Aurangabad/IISc_VaaniProject_S_Maharash... \n", "3 Audios/Aurangabad/IISc_VaaniProject_S_Maharash... \n", "4 Audios/Aurangabad/IISc_VaaniProject_S_Maharash... \n", "... ... \n", "9584927 Audios/Chamrajn/IISc_VaaniProject_M_KA_Chamraj... \n", "9584928 Audios/Chamrajn/IISc_VaaniProject_M_KA_Chamraj... \n", "9584929 Audios/Chamrajn/IISc_VaaniProject_M_KA_Chamraj... \n", "9584930 Audios/Chamrajn/IISc_VaaniProject_M_KA_Chamraj... \n", "9584931 Audios/Chamrajn/IISc_VaaniProject_M_KA_Chamraj... \n", "\n", "[9584932 rows x 6 columns]" ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df" ] }, { "cell_type": "code", "execution_count": 22, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "'Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg'" ] }, "execution_count": 22, "metadata": {}, "output_type": "execute_result" } ], "source": [ "p = os.path.join('Images', os.path.basename(files[0]))\n", "p" ] }, { "cell_type": "code", "execution_count": 23, "metadata": {}, "outputs": [ { "data": { "application/vnd.microsoft.datawrangler.viewer.v0+json": { "columns": [ { "name": "index", "rawType": "int64", "type": "integer" }, { "name": "image_name", "rawType": "object", "type": "string" }, { "name": "state", "rawType": "object", "type": "string" }, { "name": "district", "rawType": "object", "type": "string" }, { "name": "gender", "rawType": "object", "type": "string" }, { "name": "audio_language", "rawType": "object", "type": "string" }, { "name": "audio_name", "rawType": "object", "type": "string" } ], "conversionMethod": "pd.DataFrame", "ref": "8cef37c1-a594-4208-b785-3ab1520e5576", "rows": [ [ "293605", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_115366_11825947_BHSNFLM_373965_3972_8381.wav" ], [ "746685", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_68677_9763129_BHSNFLM_373965_4831_16681.wav" ], [ "746694", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_68677_9763129_BHSNFLM_373965_0_4688.wav" ], [ "855359", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_114451_11750003_BHSNFLM_373965_920_15685.wav" ], [ "1156285", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_67279_9697960_BHSNFLM_373965_13465_20345.wav" ], [ "1156411", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_67279_9697960_BHSNFLM_373965_382_12665.wav" ], [ "1157007", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_107632_11368339_BHSNFLM_373965_7285_19974.wav" ], [ "1157034", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_107632_11368339_BHSNFLM_373965_8_6799.wav" ], [ "1157692", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_117318_11923086_BHSNFLM_373965_8_12838.wav" ], [ "1157740", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_117318_11923086_BHSNFLM_373965_13005_20472.wav" ], [ "1175331", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_115366_11825947_BHSNFLM_373965_8723_14075.wav" ], [ "1175333", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_115366_11825947_BHSNFLM_373965_202_3870.wav" ], [ "1175337", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_115366_11825947_BHSNFLM_373965_14482_17161.wav" ], [ "1819646", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_113569_11690730_BHSNFLM_373965_8672_21217.wav" ], [ "1819672", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_113569_11690730_BHSNFLM_373965_258_8672.wav" ], [ "1865417", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_91175_10705139_BHSNFLM_373965_9544_18884.wav" ], [ "1865471", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_91175_10705139_BHSNFLM_373965_96_9457.wav" ], [ "3671185", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anur86934_1332240000_BHSNFLM_373965_13480_19323.wav" ], [ "3671243", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anur86934_1332240000_BHSNFLM_373965_8084_13480.wav" ], [ "3671634", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anur86934_1332240000_BHSNFLM_373965_196_8084.wav" ], [ "3671964", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anur86934_1332240000_BHSNFLM_373965_19730_25280.wav" ], [ "3798111", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Mith32120_0904480000_BHSNFLM_373965_14528_24000.wav" ], [ "3798414", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Mith32120_0904480000_BHSNFLM_373965_8981_14016.wav" ], [ "3810415", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Subo24123_1042410000_BHSNFLM_373965_160_11690.wav" ], [ "3810522", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Subo24123_1042410000_BHSNFLM_373965_12213_22282.wav" ], [ "3811369", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Manv38774_0503570000_BHSNFLM_373965_384_18069.wav" ], [ "3812246", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Manb26396_0441150000_BHSNFLM_373965_11064_20816.wav" ], [ "3812319", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Manb26396_0441150000_BHSNFLM_373965_185_10704.wav" ], [ "3834285", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Nish68757_0724000000_BHSNFLM_373965_208_20108.wav" ], [ "3864517", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Bish36312_0124470000_BHSNFLM_373965_8245_11744.wav" ], [ "3864597", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Bish36312_0124470000_BHSNFLM_373965_5088_7872.wav" ], [ "3864870", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Bish36312_0124470000_BHSNFLM_373965_12128_15722.wav" ], [ "3865418", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Bish36312_0124470000_BHSNFLM_373965_16245_19200.wav" ], [ "3927003", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rita26632_0741560000_BHSNFLM_373965_149_8842.wav" ], [ "3927228", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rita26632_0741560000_BHSNFLM_373965_21504_24490.wav" ], [ "3927319", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rita26632_0741560000_BHSNFLM_373965_9152_21237.wav" ], [ "5897778", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anki32151_1537230000_BHSNFLM_373965_16353_18143.wav" ], [ "5897788", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anki32151_1537230000_BHSNFLM_373965_7074_15343.wav" ], [ "5897804", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anki32151_1537230000_BHSNFLM_373965_1245_5600.wav" ], [ "8102521", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Bhojpuri", "/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Riti86163_1129420000_BHSNFLM_373965_22810_24064.wav" ], [ "8102523", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Bhojpuri", "/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Riti86163_1129420000_BHSNFLM_373965_19486_22445.wav" ], [ "8102524", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Bhojpuri", "/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Riti86163_1129420000_BHSNFLM_373965_17152_18802.wav" ], [ "8102527", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Bhojpuri", "/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Riti86163_1129420000_BHSNFLM_373965_15295_16896.wav" ], [ "8102528", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Bhojpuri", "/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Riti86163_1129420000_BHSNFLM_373965_11104_12593.wav" ], [ "8102529", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Bhojpuri", "/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Riti86163_1129420000_BHSNFLM_373965_4922_6538.wav" ], [ "8102532", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "male", "Bhojpuri", "/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Riti86163_1129420000_BHSNFLM_373965_1365_4550.wav" ], [ "9279230", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "/Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_119116_11958252_BHSNFLM_373965_8284_18571.wav" ], [ "9279241", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "/Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_119116_11958252_BHSNFLM_373965_734_7603.wav" ], [ "9287139", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "/Audios/Saran/IISc_VaaniProject_S_BR_Saran_99773_11031891_BHSNFLM_373965_10159_18256.wav" ], [ "9287145", "Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg", "Bihar", "Saran", "female", "Hindi", "/Audios/Saran/IISc_VaaniProject_S_BR_Saran_99773_11031891_BHSNFLM_373965_0_10159.wav" ] ], "shape": { "columns": 6, "rows": 50 } }, "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
image_namestatedistrictgenderaudio_languageaudio_name
293605Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
746685Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_6...
746694Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_6...
855359Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
1156285Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_6...
1156411Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_6...
1157007Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
1157034Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
1157692Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
1157740Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
1175331Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
1175333Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
1175337Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
1819646Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
1819672Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_1...
1865417Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_9...
1865471Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_S_Bihar_Saran_9...
3671185Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Anur...
3671243Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Anur...
3671634Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Anur...
3671964Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Anur...
3798111Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Mith...
3798414Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Mith...
3810415Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Subo...
3810522Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Subo...
3811369Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Manv...
3812246Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Manb...
3812319Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Manb...
3834285Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Nish...
3864517Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Bish...
3864597Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Bish...
3864870Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Bish...
3865418Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Bish...
3927003Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Rita...
3927228Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Rita...
3927319Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Rita...
5897778Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Anki...
5897788Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Anki...
5897804Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindiAudios/Saran/IISc_VaaniProject_M_BR_Saran_Anki...
8102521Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleBhojpuri/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit...
8102523Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleBhojpuri/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit...
8102524Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleBhojpuri/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit...
8102527Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleBhojpuri/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit...
8102528Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleBhojpuri/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit...
8102529Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleBhojpuri/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit...
8102532Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranmaleBhojpuri/Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit...
9279230Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindi/Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_...
9279241Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindi/Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_...
9287139Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindi/Audios/Saran/IISc_VaaniProject_S_BR_Saran_997...
9287145Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpgBiharSaranfemaleHindi/Audios/Saran/IISc_VaaniProject_S_BR_Saran_997...
\n", "
" ], "text/plain": [ " image_name state district \\\n", "293605 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "746685 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "746694 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "855359 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1156285 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1156411 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1157007 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1157034 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1157692 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1157740 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1175331 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1175333 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1175337 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1819646 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1819672 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1865417 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "1865471 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3671185 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3671243 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3671634 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3671964 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3798111 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3798414 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3810415 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3810522 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3811369 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3812246 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3812319 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3834285 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3864517 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3864597 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3864870 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3865418 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3927003 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3927228 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "3927319 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "5897778 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "5897788 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "5897804 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "8102521 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "8102523 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "8102524 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "8102527 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "8102528 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "8102529 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "8102532 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "9279230 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "9279241 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "9287139 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "9287145 Images/IISc_VaaniProject_Saran-SPECIFIC_00486.jpg Bihar Saran \n", "\n", " gender audio_language \\\n", "293605 male Hindi \n", "746685 male Hindi \n", "746694 male Hindi \n", "855359 female Hindi \n", "1156285 female Hindi \n", "1156411 female Hindi \n", "1157007 female Hindi \n", "1157034 female Hindi \n", "1157692 male Hindi \n", "1157740 male Hindi \n", "1175331 male Hindi \n", "1175333 male Hindi \n", "1175337 male Hindi \n", "1819646 female Hindi \n", "1819672 female Hindi \n", "1865417 male Hindi \n", "1865471 male Hindi \n", "3671185 female Hindi \n", "3671243 female Hindi \n", "3671634 female Hindi \n", "3671964 female Hindi \n", "3798111 female Hindi \n", "3798414 female Hindi \n", "3810415 male Hindi \n", "3810522 male Hindi \n", "3811369 female Hindi \n", "3812246 female Hindi \n", "3812319 female Hindi \n", "3834285 female Hindi \n", "3864517 male Hindi \n", "3864597 male Hindi \n", "3864870 male Hindi \n", "3865418 male Hindi \n", "3927003 female Hindi \n", "3927228 female Hindi \n", "3927319 female Hindi \n", "5897778 female Hindi \n", "5897788 female Hindi \n", "5897804 female Hindi \n", "8102521 male Bhojpuri \n", "8102523 male Bhojpuri \n", "8102524 male Bhojpuri \n", "8102527 male Bhojpuri \n", "8102528 male Bhojpuri \n", "8102529 male Bhojpuri \n", "8102532 male Bhojpuri \n", "9279230 female Hindi \n", "9279241 female Hindi \n", "9287139 female Hindi \n", "9287145 female Hindi \n", "\n", " audio_name \n", "293605 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "746685 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_6... \n", "746694 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_6... \n", "855359 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "1156285 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_6... \n", "1156411 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_6... \n", "1157007 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "1157034 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "1157692 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "1157740 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "1175331 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "1175333 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "1175337 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "1819646 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "1819672 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_1... \n", "1865417 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_9... \n", "1865471 Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_9... \n", "3671185 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anur... \n", "3671243 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anur... \n", "3671634 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anur... \n", "3671964 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anur... \n", "3798111 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Mith... \n", "3798414 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Mith... \n", "3810415 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Subo... \n", "3810522 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Subo... \n", "3811369 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Manv... \n", "3812246 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Manb... \n", "3812319 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Manb... \n", "3834285 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Nish... \n", "3864517 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Bish... \n", "3864597 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Bish... \n", "3864870 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Bish... \n", "3865418 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Bish... \n", "3927003 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rita... \n", "3927228 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rita... \n", "3927319 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rita... \n", "5897778 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anki... \n", "5897788 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anki... \n", "5897804 Audios/Saran/IISc_VaaniProject_M_BR_Saran_Anki... \n", "8102521 /Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit... \n", "8102523 /Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit... \n", "8102524 /Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit... \n", "8102527 /Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit... \n", "8102528 /Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit... \n", "8102529 /Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit... \n", "8102532 /Audios/Saran/IISc_VaaniProject_M_BR_Saran_Rit... \n", "9279230 /Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_... \n", "9279241 /Audios/Saran/IISc_VaaniProject_S_Bihar_Saran_... \n", "9287139 /Audios/Saran/IISc_VaaniProject_S_BR_Saran_997... \n", "9287145 /Audios/Saran/IISc_VaaniProject_S_BR_Saran_997... " ] }, "execution_count": 23, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df[df.image_name == p]" ] } ], "metadata": { "kernelspec": { "display_name": "aku_env", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.12.9" } }, "nbformat": 4, "nbformat_minor": 2 }