{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import os\n", "\n", "# Step up one directory only when 'data_categories' is not already reachable from\n", "# the working directory, so re-running this cell does not keep climbing the tree.\n", "if not os.path.isdir('data_categories'):\n", "    os.chdir('..')" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "['Health.csv',\n", " 'Books_and_Literature.csv',\n", " 'Autos_and_Vehicles.csv',\n", " 'Real Estate.csv',\n", " 'Travel_and_Transportation.csv',\n", " 'Law_and_Government.csv',\n", " 'Hobbies_and_Leisure.csv',\n", " 'People_and_Society.csv',\n", " 'Sports.csv',\n", " 'Finance.csv',\n", " 'Science.csv',\n", " 'Sensitive Subjects.csv',\n", " 'Home_and_Garden.csv',\n", " 'Adult.csv',\n", " 'Beauty_and_Fitness.csv',\n", " 'Arts_and_Entertainment.csv',\n", " 'Food_and_Drink.csv',\n", " 'News.csv',\n", " 'Internet_and_Telecom.csv',\n", " 'Games.csv',\n", " 'Reference.csv',\n", " 'Jobs_and_Education.csv',\n", " 'Business_and_Industrial.csv',\n", " 'Shopping.csv',\n", " 'Pets_and_Animals.csv',\n", " 'Computers_and_Electronics.csv',\n", " 'Online Communities.csv']" ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# List every entry in 'data_categories' except 'Final_Category_Data_With_Labels.csv'.\n", "# Filtering (rather than list.remove) keeps the listing order and does not raise\n", "# ValueError when that file is absent.\n", "files = [\n", "    name\n", "    for name in os.listdir('data_categories')\n", "    if name != 'Final_Category_Data_With_Labels.csv'\n", "]\n", "files" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | category | \n", "
---|---|
0 | \n", "Healthy diet plan | \n", "
1 | \n", "Exercise routines | \n", "
2 | \n", "Mental health tips | \n", "
3 | \n", "Weight loss strategies | \n", "
4 | \n", "Heart disease prevention | \n", "
\n", " | category | \n", "
---|---|
0 | \n", "Social media groups | \n", "
1 | \n", "Internet forums | \n", "
2 | \n", "Virtual communities | \n", "
3 | \n", "Online discussion boards | \n", "
4 | \n", "Internet subcultures | \n", "
... | \n", "... | \n", "
1093 | \n", "First Responder Healthcare Services | \n", "
1094 | \n", "Mental Health Support for First Responders | \n", "
1095 | \n", "First Responder Advocacy | \n", "
1096 | \n", "Teacher Health Education | \n", "
1097 | \n", "Teacher Healthcare Services | \n", "
33612 rows × 1 columns
\n", "\n", " | keyword | \n", "intent | \n", "
---|---|---|
0 | \n", "social media groups | \n", "informational | \n", "
1 | \n", "social media groups | \n", "navigational | \n", "
2 | \n", "internet forums | \n", "navigational | \n", "
3 | \n", "virtual communities | \n", "navigational | \n", "
4 | \n", "online discussion boards | \n", "commercial | \n", "
... | \n", "... | \n", "... | \n", "
52318 | \n", "rv camping checklist for kayakers | \n", "transactional | \n", "
52319 | \n", "rv camping checklist for kayakers | \n", "commercial | \n", "
52320 | \n", "car safety for pets traveling by air | \n", "transactional | \n", "
52321 | \n", "car safety for pets traveling by air | \n", "commercial | \n", "
52322 | \n", "motorcycle riding tips for beginners safety gear | \n", "transactional | \n", "
52323 rows × 2 columns
\n", "