{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "4e64d318", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ " dataset_id \\\n", "0 akjadhav/leandojo-lean4-formal-informal-strings \n", "1 aemska/stuhl \n", "2 Pogpotatofarmer/memes \n", "3 Splend1dchan/NMSQA_sew-d-tiny-100k-ft-ls100h \n", "4 chamisfum/brain_tumor_3_classes \n", "\n", " dataset_url downloads author \\\n", "0 https://huggingface.co/datasets/akjadhav/leand... 22 None \n", "1 https://huggingface.co/datasets/aemska/stuhl 11 None \n", "2 https://huggingface.co/datasets/Pogpotatofarme... 15 None \n", "3 https://huggingface.co/datasets/Splend1dchan/N... 11 None \n", "4 https://huggingface.co/datasets/chamisfum/brai... 8 None \n", "\n", " license tags task_categories last_modified \\\n", "0 None None None 2024-01-30 07:40:02+00:00 \n", "1 openrail None None 2022-11-11 14:12:36+00:00 \n", "2 cc None None 2022-07-15 21:11:34+00:00 \n", "3 None None None None \n", "4 None None None None \n", "\n", " reason \\\n", "0 No metadata and no description \n", "1 Short description (char count=0, words=0) \n", "2 Short description (char count=0, words=0) \n", "3 Failed to load card \n", "4 Failed to load card \n", "\n", " readme_path word_count category \n", "0 dataset_readmes/akjadhav__leandojo-lean4-forma... 0 minimal \n", "1 dataset_readmes/aemska__stuhl_README.md 0 minimal \n", "2 dataset_readmes/Pogpotatofarmer__memes_README.md 0 minimal \n", "3 None 0 minimal \n", "4 None 0 minimal \n", " dataset_id \\\n", "0 autoevaluate/autoeval-staging-eval-launch__gov... \n", "1 autoevaluate/autoeval-eval-emotion-default-fe1... \n", "2 LTCB/enwik8 \n", "3 boltuix/emotions-dataset \n", "4 yixuantt/MultiHopRAG \n", "\n", " dataset_url downloads author \\\n", "0 https://huggingface.co/datasets/autoevaluate/a... 8 None \n", "1 https://huggingface.co/datasets/autoevaluate/a... 
8 None \n", "2 https://huggingface.co/datasets/LTCB/enwik8 154 None \n", "3 https://huggingface.co/datasets/boltuix/emotio... 754 None \n", "4 https://huggingface.co/datasets/yixuantt/Multi... 7050 None \n", "\n", " license tags \\\n", "0 None autotrain, evaluation \n", "1 None autotrain, evaluation \n", "2 ['mit'] None \n", "3 mit emotions, nlp, sentiment-analysis, emotion-cla... \n", "4 odc-by None \n", "\n", " task_categories last_modified reason \\\n", "0 None 2022-09-09 07:44:04+00:00 None \n", "1 None 2022-09-16 20:22:59+00:00 None \n", "2 fill-mask, text-generation 2024-01-18 11:19:13+00:00 None \n", "3 None 2025-05-25 15:41:59+00:00 None \n", "4 question-answering, feature-extraction 2024-01-30 02:49:29+00:00 None \n", "\n", " readme_path word_count category \n", "0 dataset_readmes/autoevaluate__autoeval-staging... 55 rich \n", "1 dataset_readmes/autoevaluate__autoeval-eval-em... 57 rich \n", "2 dataset_readmes/LTCB__enwik8_README.md 427 rich \n", "3 dataset_readmes/boltuix__emotions-dataset_READ... 1643 rich \n", "4 dataset_readmes/yixuantt__MultiHopRAG_README.md 111 rich \n" ] } ], "source": [ "import os\n", "from pathlib import Path\n", "\n", "import pandas as pd\n", "\n", "# Directory that holds the parquet exports. It defaults to the original\n", "# author's checkout so existing runs behave the same; set the\n", "# DATASET_INSIGHT_DIR environment variable to run the notebook elsewhere.\n", "# `or` (rather than a .get() default) also covers an empty variable.\n", "DATA_DIR = Path(\n", "    os.environ.get(\"DATASET_INSIGHT_DIR\")\n", "    or \"/home/santosh/Repositories/personal/huggingface/dataset-insight-portal\"\n", ")\n", "\n", "# Read parquet files: df1 <- all_minimal_dataset_cards, df2 <- all_rich_dataset_cards.\n", "# The names df1/df2 are kept because later cells may refer to them.\n", "df1 = pd.read_parquet(DATA_DIR / \"all_minimal_dataset_cards.parquet\")\n", "df2 = pd.read_parquet(DATA_DIR / \"all_rich_dataset_cards.parquet\")\n", "\n", "# Display first few rows (plain-text stdout, matching the saved stream output)\n", "print(df1.head())\n", "print(df2.head())" ] }, { "cell_type": "code", "execution_count": 2, "id": "e9a20931", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | dataset_id | \n", "dataset_url | \n", "downloads | \n", "author | \n", "license | \n", "tags | \n", "task_categories | \n", "last_modified | \n", "reason | \n", "readme_path | \n", "word_count | \n", "category | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "akjadhav/leandojo-lean4-formal-informal-strings | \n", "https://huggingface.co/datasets/akjadhav/leand... | \n", "22 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "2024-01-30 07:40:02+00:00 | \n", "No metadata and no description | \n", "dataset_readmes/akjadhav__leandojo-lean4-forma... | \n", "0 | \n", "minimal | \n", "
1 | \n", "aemska/stuhl | \n", "https://huggingface.co/datasets/aemska/stuhl | \n", "11 | \n", "None | \n", "openrail | \n", "None | \n", "None | \n", "2022-11-11 14:12:36+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/aemska__stuhl_README.md | \n", "0 | \n", "minimal | \n", "
2 | \n", "Pogpotatofarmer/memes | \n", "https://huggingface.co/datasets/Pogpotatofarme... | \n", "15 | \n", "None | \n", "cc | \n", "None | \n", "None | \n", "2022-07-15 21:11:34+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/Pogpotatofarmer__memes_README.md | \n", "0 | \n", "minimal | \n", "
3 | \n", "Splend1dchan/NMSQA_sew-d-tiny-100k-ft-ls100h | \n", "https://huggingface.co/datasets/Splend1dchan/N... | \n", "11 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "None | \n", "Failed to load card | \n", "None | \n", "0 | \n", "minimal | \n", "
4 | \n", "chamisfum/brain_tumor_3_classes | \n", "https://huggingface.co/datasets/chamisfum/brai... | \n", "8 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "None | \n", "Failed to load card | \n", "None | \n", "0 | \n", "minimal | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
400292 | \n", "TAUR-dev/D-EVAL__standard_eval_v3__RC_BF_ab-bo... | \n", "https://huggingface.co/datasets/TAUR-dev/D-EVA... | \n", "0 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "2025-09-19 06:27:52+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/TAUR-dev__D-EVAL__standard_eva... | \n", "0 | \n", "minimal | \n", "
400293 | \n", "TAUR-dev/D-EVAL__standard_eval_v3__RC_BF_ab-bo... | \n", "https://huggingface.co/datasets/TAUR-dev/D-EVA... | \n", "0 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "2025-09-19 06:28:16+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/TAUR-dev__D-EVAL__standard_eva... | \n", "0 | \n", "minimal | \n", "
400294 | \n", "haru101/Minecraft-Knowledge-Dataset | \n", "https://huggingface.co/datasets/haru101/Minecr... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "None | \n", "question-answering | \n", "2025-09-19 06:33:33+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/haru101__Minecraft-Knowledge-D... | \n", "0 | \n", "minimal | \n", "
400295 | \n", "sxj1215/mmimdb_sorted_with_label_2 | \n", "https://huggingface.co/datasets/sxj1215/mmimdb... | \n", "0 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "2025-09-19 06:35:25+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/sxj1215__mmimdb_sorted_with_la... | \n", "0 | \n", "minimal | \n", "
400296 | \n", "Vikir2411CS19/Multimodal_Complaint | \n", "https://huggingface.co/datasets/Vikir2411CS19/... | \n", "0 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "2025-09-19 06:35:01+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/Vikir2411CS19__Multimodal_Comp... | \n", "0 | \n", "minimal | \n", "
400297 rows × 12 columns
\n", "\n", " | id | \n", "url | \n", "field | \n", "keyword | \n", "missing_readme | \n", "missing_card | \n", "
---|---|---|---|---|---|---|
0 | \n", "solomonk/reddit_mental_health_posts | \n", "https://huggingface.co/datasets/solomonk/reddi... | \n", "life_sciences | \n", "health | \n", "False | \n", "True | \n", "
1 | \n", "Kira-Asimov/gender_clinical_trial | \n", "https://huggingface.co/datasets/Kira-Asimov/ge... | \n", "life_sciences | \n", "clinical | \n", "False | \n", "True | \n", "
2 | \n", "samhog/psychology-6k | \n", "https://huggingface.co/datasets/samhog/psychol... | \n", "life_sciences | \n", "psychology | \n", "True | \n", "True | \n", "
3 | \n", "TCMLM/real_clinical_cases_of_Famous_Old_TCM_Do... | \n", "https://huggingface.co/datasets/TCMLM/real_cli... | \n", "life_sciences | \n", "clinical | \n", "False | \n", "True | \n", "
4 | \n", "jibrand/plant-dataset-JSONL | \n", "https://huggingface.co/datasets/jibrand/plant-... | \n", "agriculture_and_biology | \n", "plant | \n", "True | \n", "True | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
4035 | \n", "AshwinManohar/medicine_normalizer_alpaca | \n", "https://huggingface.co/datasets/AshwinManohar/... | \n", "life_sciences | \n", "medicine | \n", "True | \n", "True | \n", "
4036 | \n", "AshwinManohar/medicine_parser_alpaca | \n", "https://huggingface.co/datasets/AshwinManohar/... | \n", "life_sciences | \n", "medicine | \n", "True | \n", "True | \n", "
4037 | \n", "AshwinManohar/medicine_normalizer_alpaca_20k | \n", "https://huggingface.co/datasets/AshwinManohar/... | \n", "life_sciences | \n", "medicine | \n", "True | \n", "True | \n", "
4038 | \n", "Adithyaaaa/plant_leaf_classification | \n", "https://huggingface.co/datasets/Adithyaaaa/pla... | \n", "agriculture_and_biology | \n", "plant | \n", "True | \n", "True | \n", "
4039 | \n", "benali-ai-24/drug-data-public | \n", "https://huggingface.co/datasets/benali-ai-24/d... | \n", "life_sciences | \n", "drug | \n", "True | \n", "True | \n", "
4040 rows × 6 columns
\n", "\n", " | dataset_id | \n", "dataset_url | \n", "downloads | \n", "author | \n", "license | \n", "tags | \n", "task_categories | \n", "last_modified | \n", "reason | \n", "readme_path | \n", "word_count | \n", "category | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "akjadhav/leandojo-lean4-formal-informal-strings | \n", "https://huggingface.co/datasets/akjadhav/leand... | \n", "22 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "2024-01-30 07:40:02+00:00 | \n", "No metadata and no description | \n", "dataset_readmes/akjadhav__leandojo-lean4-forma... | \n", "0 | \n", "minimal | \n", "
1 | \n", "aemska/stuhl | \n", "https://huggingface.co/datasets/aemska/stuhl | \n", "11 | \n", "None | \n", "openrail | \n", "None | \n", "None | \n", "2022-11-11 14:12:36+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/aemska__stuhl_README.md | \n", "0 | \n", "minimal | \n", "
2 | \n", "Pogpotatofarmer/memes | \n", "https://huggingface.co/datasets/Pogpotatofarme... | \n", "15 | \n", "None | \n", "cc | \n", "None | \n", "None | \n", "2022-07-15 21:11:34+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/Pogpotatofarmer__memes_README.md | \n", "0 | \n", "minimal | \n", "
3 | \n", "Splend1dchan/NMSQA_sew-d-tiny-100k-ft-ls100h | \n", "https://huggingface.co/datasets/Splend1dchan/N... | \n", "11 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "None | \n", "Failed to load card | \n", "None | \n", "0 | \n", "minimal | \n", "
4 | \n", "chamisfum/brain_tumor_3_classes | \n", "https://huggingface.co/datasets/chamisfum/brai... | \n", "8 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "None | \n", "Failed to load card | \n", "None | \n", "0 | \n", "minimal | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
503185 | \n", "ROBOTIS/ffw_bg2_rev4_pick_coffee_bottle_env5_14 | \n", "https://huggingface.co/datasets/ROBOTIS/ffw_bg... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:28:15+00:00 | \n", "None | \n", "dataset_readmes/ROBOTIS__ffw_bg2_rev4_pick_cof... | \n", "299 | \n", "rich | \n", "
503186 | \n", "ROBOTIS/ffw_bg2_rev4_pick_coffee_bottle_env5_15 | \n", "https://huggingface.co/datasets/ROBOTIS/ffw_bg... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:29:40+00:00 | \n", "None | \n", "dataset_readmes/ROBOTIS__ffw_bg2_rev4_pick_cof... | \n", "299 | \n", "rich | \n", "
503187 | \n", "Dongkkka/ffw_bg2_rev4_custom_0919_5 | \n", "https://huggingface.co/datasets/Dongkkka/ffw_b... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:30:53+00:00 | \n", "None | \n", "dataset_readmes/Dongkkka__ffw_bg2_rev4_custom_... | \n", "299 | \n", "rich | \n", "
503188 | \n", "chenxing1234567890/eval_testZ1.2.1 | \n", "https://huggingface.co/datasets/chenxing123456... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, tutorial | \n", "robotics | \n", "2025-09-19 06:34:11+00:00 | \n", "None | \n", "dataset_readmes/chenxing1234567890__eval_testZ... | \n", "231 | \n", "rich | \n", "
503189 | \n", "Dongkkka/ffw_bg2_rev4_custom_0919_6 | \n", "https://huggingface.co/datasets/Dongkkka/ffw_b... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:34:09+00:00 | \n", "None | \n", "dataset_readmes/Dongkkka__ffw_bg2_rev4_custom_... | \n", "299 | \n", "rich | \n", "
503190 rows × 12 columns
\n", "\n", " | dataset_id | \n", "dataset_url | \n", "downloads | \n", "author | \n", "license | \n", "tags | \n", "task_categories | \n", "last_modified | \n", "reason | \n", "readme_path | \n", "word_count | \n", "category | \n", "_dataset_id_lower | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "akjadhav/leandojo-lean4-formal-informal-strings | \n", "https://huggingface.co/datasets/akjadhav/leand... | \n", "22 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "2024-01-30 07:40:02+00:00 | \n", "No metadata and no description | \n", "dataset_readmes/akjadhav__leandojo-lean4-forma... | \n", "0 | \n", "minimal | \n", "akjadhav/leandojo-lean4-formal-informal-strings | \n", "
1 | \n", "aemska/stuhl | \n", "https://huggingface.co/datasets/aemska/stuhl | \n", "11 | \n", "None | \n", "openrail | \n", "None | \n", "None | \n", "2022-11-11 14:12:36+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/aemska__stuhl_README.md | \n", "0 | \n", "minimal | \n", "aemska/stuhl | \n", "
2 | \n", "Pogpotatofarmer/memes | \n", "https://huggingface.co/datasets/Pogpotatofarme... | \n", "15 | \n", "None | \n", "cc | \n", "None | \n", "None | \n", "2022-07-15 21:11:34+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/Pogpotatofarmer__memes_README.md | \n", "0 | \n", "minimal | \n", "pogpotatofarmer/memes | \n", "
3 | \n", "Splend1dchan/NMSQA_sew-d-tiny-100k-ft-ls100h | \n", "https://huggingface.co/datasets/Splend1dchan/N... | \n", "11 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "None | \n", "Failed to load card | \n", "None | \n", "0 | \n", "minimal | \n", "splend1dchan/nmsqa_sew-d-tiny-100k-ft-ls100h | \n", "
4 | \n", "chamisfum/brain_tumor_3_classes | \n", "https://huggingface.co/datasets/chamisfum/brai... | \n", "8 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "None | \n", "Failed to load card | \n", "None | \n", "0 | \n", "minimal | \n", "chamisfum/brain_tumor_3_classes | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
503185 | \n", "ROBOTIS/ffw_bg2_rev4_pick_coffee_bottle_env5_14 | \n", "https://huggingface.co/datasets/ROBOTIS/ffw_bg... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:28:15+00:00 | \n", "None | \n", "dataset_readmes/ROBOTIS__ffw_bg2_rev4_pick_cof... | \n", "299 | \n", "rich | \n", "robotis/ffw_bg2_rev4_pick_coffee_bottle_env5_14 | \n", "
503186 | \n", "ROBOTIS/ffw_bg2_rev4_pick_coffee_bottle_env5_15 | \n", "https://huggingface.co/datasets/ROBOTIS/ffw_bg... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:29:40+00:00 | \n", "None | \n", "dataset_readmes/ROBOTIS__ffw_bg2_rev4_pick_cof... | \n", "299 | \n", "rich | \n", "robotis/ffw_bg2_rev4_pick_coffee_bottle_env5_15 | \n", "
503187 | \n", "Dongkkka/ffw_bg2_rev4_custom_0919_5 | \n", "https://huggingface.co/datasets/Dongkkka/ffw_b... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:30:53+00:00 | \n", "None | \n", "dataset_readmes/Dongkkka__ffw_bg2_rev4_custom_... | \n", "299 | \n", "rich | \n", "dongkkka/ffw_bg2_rev4_custom_0919_5 | \n", "
503188 | \n", "chenxing1234567890/eval_testZ1.2.1 | \n", "https://huggingface.co/datasets/chenxing123456... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, tutorial | \n", "robotics | \n", "2025-09-19 06:34:11+00:00 | \n", "None | \n", "dataset_readmes/chenxing1234567890__eval_testZ... | \n", "231 | \n", "rich | \n", "chenxing1234567890/eval_testz1.2.1 | \n", "
503189 | \n", "Dongkkka/ffw_bg2_rev4_custom_0919_6 | \n", "https://huggingface.co/datasets/Dongkkka/ffw_b... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:34:09+00:00 | \n", "None | \n", "dataset_readmes/Dongkkka__ffw_bg2_rev4_custom_... | \n", "299 | \n", "rich | \n", "dongkkka/ffw_bg2_rev4_custom_0919_6 | \n", "
503190 rows × 13 columns
\n", "\n", " | dataset_id | \n", "dataset_url | \n", "downloads | \n", "author | \n", "license | \n", "tags | \n", "task_categories | \n", "last_modified | \n", "reason | \n", "readme_path | \n", "word_count | \n", "category | \n", "field | \n", "keyword | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "akjadhav/leandojo-lean4-formal-informal-strings | \n", "https://huggingface.co/datasets/akjadhav/leand... | \n", "22 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "2024-01-30 07:40:02+00:00 | \n", "No metadata and no description | \n", "dataset_readmes/akjadhav__leandojo-lean4-forma... | \n", "0 | \n", "minimal | \n", "NaN | \n", "NaN | \n", "
1 | \n", "aemska/stuhl | \n", "https://huggingface.co/datasets/aemska/stuhl | \n", "11 | \n", "None | \n", "openrail | \n", "None | \n", "None | \n", "2022-11-11 14:12:36+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/aemska__stuhl_README.md | \n", "0 | \n", "minimal | \n", "NaN | \n", "NaN | \n", "
2 | \n", "Pogpotatofarmer/memes | \n", "https://huggingface.co/datasets/Pogpotatofarme... | \n", "15 | \n", "None | \n", "cc | \n", "None | \n", "None | \n", "2022-07-15 21:11:34+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/Pogpotatofarmer__memes_README.md | \n", "0 | \n", "minimal | \n", "NaN | \n", "NaN | \n", "
3 | \n", "Splend1dchan/NMSQA_sew-d-tiny-100k-ft-ls100h | \n", "https://huggingface.co/datasets/Splend1dchan/N... | \n", "11 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "None | \n", "Failed to load card | \n", "None | \n", "0 | \n", "minimal | \n", "NaN | \n", "NaN | \n", "
4 | \n", "chamisfum/brain_tumor_3_classes | \n", "https://huggingface.co/datasets/chamisfum/brai... | \n", "8 | \n", "None | \n", "None | \n", "None | \n", "None | \n", "None | \n", "Failed to load card | \n", "None | \n", "0 | \n", "minimal | \n", "life_sciences | \n", "brain | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
503185 | \n", "ROBOTIS/ffw_bg2_rev4_pick_coffee_bottle_env5_14 | \n", "https://huggingface.co/datasets/ROBOTIS/ffw_bg... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:28:15+00:00 | \n", "None | \n", "dataset_readmes/ROBOTIS__ffw_bg2_rev4_pick_cof... | \n", "299 | \n", "rich | \n", "NaN | \n", "NaN | \n", "
503186 | \n", "ROBOTIS/ffw_bg2_rev4_pick_coffee_bottle_env5_15 | \n", "https://huggingface.co/datasets/ROBOTIS/ffw_bg... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:29:40+00:00 | \n", "None | \n", "dataset_readmes/ROBOTIS__ffw_bg2_rev4_pick_cof... | \n", "299 | \n", "rich | \n", "NaN | \n", "NaN | \n", "
503187 | \n", "Dongkkka/ffw_bg2_rev4_custom_0919_5 | \n", "https://huggingface.co/datasets/Dongkkka/ffw_b... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:30:53+00:00 | \n", "None | \n", "dataset_readmes/Dongkkka__ffw_bg2_rev4_custom_... | \n", "299 | \n", "rich | \n", "NaN | \n", "NaN | \n", "
503188 | \n", "chenxing1234567890/eval_testZ1.2.1 | \n", "https://huggingface.co/datasets/chenxing123456... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, tutorial | \n", "robotics | \n", "2025-09-19 06:34:11+00:00 | \n", "None | \n", "dataset_readmes/chenxing1234567890__eval_testZ... | \n", "231 | \n", "rich | \n", "NaN | \n", "NaN | \n", "
503189 | \n", "Dongkkka/ffw_bg2_rev4_custom_0919_6 | \n", "https://huggingface.co/datasets/Dongkkka/ffw_b... | \n", "0 | \n", "None | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:34:09+00:00 | \n", "None | \n", "dataset_readmes/Dongkkka__ffw_bg2_rev4_custom_... | \n", "299 | \n", "rich | \n", "NaN | \n", "NaN | \n", "
503190 rows × 14 columns
\n", "\n", " | dataset_id | \n", "dataset_url | \n", "downloads | \n", "author | \n", "license | \n", "tags | \n", "task_categories | \n", "last_modified | \n", "reason | \n", "readme_path | \n", "word_count | \n", "category | \n", "field | \n", "keyword | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "akjadhav/leandojo-lean4-formal-informal-strings | \n", "https://huggingface.co/datasets/akjadhav/leand... | \n", "22 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "2024-01-30 07:40:02+00:00 | \n", "No metadata and no description | \n", "dataset_readmes/akjadhav__leandojo-lean4-forma... | \n", "0 | \n", "minimal | \n", "NaN | \n", "NaN | \n", "
1 | \n", "aemska/stuhl | \n", "https://huggingface.co/datasets/aemska/stuhl | \n", "11 | \n", "NaN | \n", "openrail | \n", "NaN | \n", "NaN | \n", "2022-11-11 14:12:36+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/aemska__stuhl_README.md | \n", "0 | \n", "minimal | \n", "NaN | \n", "NaN | \n", "
2 | \n", "Pogpotatofarmer/memes | \n", "https://huggingface.co/datasets/Pogpotatofarme... | \n", "15 | \n", "NaN | \n", "cc | \n", "NaN | \n", "NaN | \n", "2022-07-15 21:11:34+00:00 | \n", "Short description (char count=0, words=0) | \n", "dataset_readmes/Pogpotatofarmer__memes_README.md | \n", "0 | \n", "minimal | \n", "NaN | \n", "NaN | \n", "
3 | \n", "Splend1dchan/NMSQA_sew-d-tiny-100k-ft-ls100h | \n", "https://huggingface.co/datasets/Splend1dchan/N... | \n", "11 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "Failed to load card | \n", "NaN | \n", "0 | \n", "minimal | \n", "NaN | \n", "NaN | \n", "
4 | \n", "chamisfum/brain_tumor_3_classes | \n", "https://huggingface.co/datasets/chamisfum/brai... | \n", "8 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "Failed to load card | \n", "NaN | \n", "0 | \n", "minimal | \n", "life_sciences | \n", "brain | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
503185 | \n", "ROBOTIS/ffw_bg2_rev4_pick_coffee_bottle_env5_14 | \n", "https://huggingface.co/datasets/ROBOTIS/ffw_bg... | \n", "0 | \n", "NaN | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:28:15+00:00 | \n", "NaN | \n", "dataset_readmes/ROBOTIS__ffw_bg2_rev4_pick_cof... | \n", "299 | \n", "rich | \n", "NaN | \n", "NaN | \n", "
503186 | \n", "ROBOTIS/ffw_bg2_rev4_pick_coffee_bottle_env5_15 | \n", "https://huggingface.co/datasets/ROBOTIS/ffw_bg... | \n", "0 | \n", "NaN | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:29:40+00:00 | \n", "NaN | \n", "dataset_readmes/ROBOTIS__ffw_bg2_rev4_pick_cof... | \n", "299 | \n", "rich | \n", "NaN | \n", "NaN | \n", "
503187 | \n", "Dongkkka/ffw_bg2_rev4_custom_0919_5 | \n", "https://huggingface.co/datasets/Dongkkka/ffw_b... | \n", "0 | \n", "NaN | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:30:53+00:00 | \n", "NaN | \n", "dataset_readmes/Dongkkka__ffw_bg2_rev4_custom_... | \n", "299 | \n", "rich | \n", "NaN | \n", "NaN | \n", "
503188 | \n", "chenxing1234567890/eval_testZ1.2.1 | \n", "https://huggingface.co/datasets/chenxing123456... | \n", "0 | \n", "NaN | \n", "apache-2.0 | \n", "LeRobot, tutorial | \n", "robotics | \n", "2025-09-19 06:34:11+00:00 | \n", "NaN | \n", "dataset_readmes/chenxing1234567890__eval_testZ... | \n", "231 | \n", "rich | \n", "NaN | \n", "NaN | \n", "
503189 | \n", "Dongkkka/ffw_bg2_rev4_custom_0919_6 | \n", "https://huggingface.co/datasets/Dongkkka/ffw_b... | \n", "0 | \n", "NaN | \n", "apache-2.0 | \n", "LeRobot, ffw_bg2_rev4_custom, robotis | \n", "robotics | \n", "2025-09-19 06:34:09+00:00 | \n", "NaN | \n", "dataset_readmes/Dongkkka__ffw_bg2_rev4_custom_... | \n", "299 | \n", "rich | \n", "NaN | \n", "NaN | \n", "
503190 rows × 14 columns
\n", "