Upload files to "/"
This commit is contained in:
parent
1dbfae5442
commit
de68b38f74
668
fitur_ekstraksi_BOW.ipynb
Normal file
668
fitur_ekstraksi_BOW.ipynb
Normal file
@ -0,0 +1,668 @@
|
|||||||
|
{
|
||||||
|
"nbformat": 4,
|
||||||
|
"nbformat_minor": 0,
|
||||||
|
"metadata": {
|
||||||
|
"colab": {
|
||||||
|
"provenance": []
|
||||||
|
},
|
||||||
|
"kernelspec": {
|
||||||
|
"name": "python3",
|
||||||
|
"display_name": "Python 3"
|
||||||
|
},
|
||||||
|
"language_info": {
|
||||||
|
"name": "python"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"cells": [
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"metadata": {
|
||||||
|
"id": "PKHmOczbUdK0"
|
||||||
|
},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"{\n",
|
||||||
|
" \"cells\": [\n",
|
||||||
|
" {\n",
|
||||||
|
" \"cell_type\": \"code\",\n",
|
||||||
|
" \"execution_count\": 11,\n",
|
||||||
|
" \"metadata\": {\n",
|
||||||
|
" \"id\": \"qBYcPYAb059g\"\n",
|
||||||
|
" },\n",
|
||||||
|
" \"outputs\": [],\n",
|
||||||
|
" \"source\": [\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"# 1. IMPORT LIBRARY\\n\",\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"import re\\n\",\n",
|
||||||
|
" \"import pandas as pd\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"from sklearn.feature_extraction.text import CountVectorizer\\n\",\n",
|
||||||
|
" \"from sklearn.naive_bayes import MultinomialNB\\n\",\n",
|
||||||
|
" \"from sklearn.metrics import accuracy_score, confusion_matrix, classification_report\"\n",
|
||||||
|
" ]\n",
|
||||||
|
" },\n",
|
||||||
|
" {\n",
|
||||||
|
" \"cell_type\": \"code\",\n",
|
||||||
|
" \"execution_count\": 12,\n",
|
||||||
|
" \"metadata\": {\n",
|
||||||
|
" \"id\": \"mo-yt5Ob1N8j\"\n",
|
||||||
|
" },\n",
|
||||||
|
" \"outputs\": [],\n",
|
||||||
|
" \"source\": [\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"# 2. DATA TEKS MANUAL\\n\",\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"documents = [\\n\",\n",
|
||||||
|
" \" \\\"saya suka belajar data science\\\",\\n\",\n",
|
||||||
|
" \" \\\"machine learning sangat menarik\\\",\\n\",\n",
|
||||||
|
" \" \\\"saya tidak suka matematika\\\",\\n\",\n",
|
||||||
|
" \" \\\"belajar python itu menyenangkan\\\",\\n\",\n",
|
||||||
|
" \" \\\"data science membutuhkan matematika\\\",\\n\",\n",
|
||||||
|
" \" \\\"python sangat membantu data science\\\"\\n\",\n",
|
||||||
|
" \"]\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"labels = [\\n\",\n",
|
||||||
|
" \" \\\"positif\\\",\\n\",\n",
|
||||||
|
" \" \\\"positif\\\",\\n\",\n",
|
||||||
|
" \" \\\"negatif\\\",\\n\",\n",
|
||||||
|
" \" \\\"positif\\\",\\n\",\n",
|
||||||
|
" \" \\\"netral\\\",\\n\",\n",
|
||||||
|
" \" \\\"positif\\\"\\n\",\n",
|
||||||
|
" \"]\"\n",
|
||||||
|
" ]\n",
|
||||||
|
" },\n",
|
||||||
|
" {\n",
|
||||||
|
" \"cell_type\": \"code\",\n",
|
||||||
|
" \"execution_count\": 13,\n",
|
||||||
|
" \"metadata\": {\n",
|
||||||
|
" \"id\": \"FkmxRAFq1oDK\"\n",
|
||||||
|
" },\n",
|
||||||
|
" \"outputs\": [],\n",
|
||||||
|
" \"source\": [\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"# 3. PREPROCESSING\\n\",\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"def clean_text(text):\\n\",\n",
|
||||||
|
" \" text = text.lower()\\n\",\n",
|
||||||
|
" \" text = re.sub(r\\\"[^a-z\\\\s]\\\", \\\"\\\", text)\\n\",\n",
|
||||||
|
" \" text = re.sub(r\\\"\\\\s+\\\", \\\" \\\", text).strip()\\n\",\n",
|
||||||
|
" \" return text\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"documents = [clean_text(doc) for doc in documents]\"\n",
|
||||||
|
" ]\n",
|
||||||
|
" },\n",
|
||||||
|
" {\n",
|
||||||
|
" \"cell_type\": \"code\",\n",
|
||||||
|
" \"execution_count\": 14,\n",
|
||||||
|
" \"metadata\": {\n",
|
||||||
|
" \"colab\": {\n",
|
||||||
|
" \"base_uri\": \"https://localhost:8080/\"\n",
|
||||||
|
" },\n",
|
||||||
|
" \"id\": \"ybC1Vo2C_c3q\",\n",
|
||||||
|
" \"outputId\": \"1695b30d-059d-4bce-e224-7c100b1958ee\"\n",
|
||||||
|
" },\n",
|
||||||
|
" \"outputs\": [\n",
|
||||||
|
" {\n",
|
||||||
|
" \"output_type\": \"stream\",\n",
|
||||||
|
" \"name\": \"stdout\",\n",
|
||||||
|
" \"text\": [\n",
|
||||||
|
" \"=== Bag of Words ===\\n\",\n",
|
||||||
|
" \" belajar data itu learning machine matematika membantu membutuhkan \\\\\\n\",\n",
|
||||||
|
" \"0 1 1 0 0 0 0 0 0 \\n\",\n",
|
||||||
|
" \"1 0 0 0 1 1 0 0 0 \\n\",\n",
|
||||||
|
" \"2 0 0 0 0 0 1 0 0 \\n\",\n",
|
||||||
|
" \"3 1 0 1 0 0 0 0 0 \\n\",\n",
|
||||||
|
" \"4 0 1 0 0 0 1 0 1 \\n\",\n",
|
||||||
|
" \"5 0 1 0 0 0 0 1 0 \\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \" menarik menyenangkan python sangat saya science suka tidak \\n\",\n",
|
||||||
|
" \"0 0 0 0 0 1 1 1 0 \\n\",\n",
|
||||||
|
" \"1 1 0 0 1 0 0 0 0 \\n\",\n",
|
||||||
|
" \"2 0 0 0 0 1 0 1 1 \\n\",\n",
|
||||||
|
" \"3 0 1 1 0 0 0 0 0 \\n\",\n",
|
||||||
|
" \"4 0 0 0 0 0 1 0 0 \\n\",\n",
|
||||||
|
" \"5 0 0 1 1 0 1 0 0 \\n\"\n",
|
||||||
|
" ]\n",
|
||||||
|
" }\n",
|
||||||
|
" ],\n",
|
||||||
|
" \"source\": [\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"# 4. FEATURE EXTRACTION (BOW)\\n\",\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"vectorizer = CountVectorizer()\\n\",\n",
|
||||||
|
" \"X = vectorizer.fit_transform(documents)\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"df_bow = pd.DataFrame(\\n\",\n",
|
||||||
|
" \" X.toarray(),\\n\",\n",
|
||||||
|
" \" columns=vectorizer.get_feature_names_out()\\n\",\n",
|
||||||
|
" \")\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"print(\\\"=== Bag of Words ===\\\")\\n\",\n",
|
||||||
|
" \"print(df_bow)\"\n",
|
||||||
|
" ]\n",
|
||||||
|
" },\n",
|
||||||
|
" {\n",
|
||||||
|
" \"cell_type\": \"code\",\n",
|
||||||
|
" \"execution_count\": 15,\n",
|
||||||
|
" \"metadata\": {\n",
|
||||||
|
" \"colab\": {\n",
|
||||||
|
" \"base_uri\": \"https://localhost:8080/\",\n",
|
||||||
|
" \"height\": 80\n",
|
||||||
|
" },\n",
|
||||||
|
" \"id\": \"s6S-Ma4R1xuq\",\n",
|
||||||
|
" \"outputId\": \"f65359e3-bb87-42b4-fb37-9c035f88e7ad\"\n",
|
||||||
|
" },\n",
|
||||||
|
" \"outputs\": [\n",
|
||||||
|
" {\n",
|
||||||
|
" \"output_type\": \"execute_result\",\n",
|
||||||
|
" \"data\": {\n",
|
||||||
|
" \"text/plain\": [\n",
|
||||||
|
" \"MultinomialNB()\"\n",
|
||||||
|
" ],\n",
|
||||||
|
" \"text/html\": [\n",
|
||||||
|
" \"<style>#sk-container-id-1 {\\n\",\n",
|
||||||
|
" \" /* Definition of color scheme common for light and dark mode */\\n\",\n",
|
||||||
|
" \" --sklearn-color-text: #000;\\n\",\n",
|
||||||
|
" \" --sklearn-color-text-muted: #666;\\n\",\n",
|
||||||
|
" \" --sklearn-color-line: gray;\\n\",\n",
|
||||||
|
" \" /* Definition of color scheme for unfitted estimators */\\n\",\n",
|
||||||
|
" \" --sklearn-color-unfitted-level-0: #fff5e6;\\n\",\n",
|
||||||
|
" \" --sklearn-color-unfitted-level-1: #f6e4d2;\\n\",\n",
|
||||||
|
" \" --sklearn-color-unfitted-level-2: #ffe0b3;\\n\",\n",
|
||||||
|
" \" --sklearn-color-unfitted-level-3: chocolate;\\n\",\n",
|
||||||
|
" \" /* Definition of color scheme for fitted estimators */\\n\",\n",
|
||||||
|
" \" --sklearn-color-fitted-level-0: #f0f8ff;\\n\",\n",
|
||||||
|
" \" --sklearn-color-fitted-level-1: #d4ebff;\\n\",\n",
|
||||||
|
" \" --sklearn-color-fitted-level-2: #b3dbfd;\\n\",\n",
|
||||||
|
" \" --sklearn-color-fitted-level-3: cornflowerblue;\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \" /* Specific color for light theme */\\n\",\n",
|
||||||
|
" \" --sklearn-color-text-on-default-background: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, black)));\\n\",\n",
|
||||||
|
" \" --sklearn-color-background: var(--sg-background-color, var(--theme-background, var(--jp-layout-color0, white)));\\n\",\n",
|
||||||
|
" \" --sklearn-color-border-box: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, black)));\\n\",\n",
|
||||||
|
" \" --sklearn-color-icon: #696969;\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \" @media (prefers-color-scheme: dark) {\\n\",\n",
|
||||||
|
" \" /* Redefinition of color scheme for dark theme */\\n\",\n",
|
||||||
|
" \" --sklearn-color-text-on-default-background: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, white)));\\n\",\n",
|
||||||
|
" \" --sklearn-color-background: var(--sg-background-color, var(--theme-background, var(--jp-layout-color0, #111)));\\n\",\n",
|
||||||
|
" \" --sklearn-color-border-box: var(--sg-text-color, var(--theme-code-foreground, var(--jp-content-font-color1, white)));\\n\",\n",
|
||||||
|
" \" --sklearn-color-icon: #878787;\\n\",\n",
|
||||||
|
" \" }\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 {\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-text);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 pre {\\n\",\n",
|
||||||
|
" \" padding: 0;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 input.sk-hidden--visually {\\n\",\n",
|
||||||
|
" \" border: 0;\\n\",\n",
|
||||||
|
" \" clip: rect(1px 1px 1px 1px);\\n\",\n",
|
||||||
|
" \" clip: rect(1px, 1px, 1px, 1px);\\n\",\n",
|
||||||
|
" \" height: 1px;\\n\",\n",
|
||||||
|
" \" margin: -1px;\\n\",\n",
|
||||||
|
" \" overflow: hidden;\\n\",\n",
|
||||||
|
" \" padding: 0;\\n\",\n",
|
||||||
|
" \" position: absolute;\\n\",\n",
|
||||||
|
" \" width: 1px;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-dashed-wrapped {\\n\",\n",
|
||||||
|
" \" border: 1px dashed var(--sklearn-color-line);\\n\",\n",
|
||||||
|
" \" margin: 0 0.4em 0.5em 0.4em;\\n\",\n",
|
||||||
|
" \" box-sizing: border-box;\\n\",\n",
|
||||||
|
" \" padding-bottom: 0.4em;\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-background);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-container {\\n\",\n",
|
||||||
|
" \" /* jupyter's `normalize.less` sets `[hidden] { display: none; }`\\n\",\n",
|
||||||
|
" \" but bootstrap.min.css set `[hidden] { display: none !important; }`\\n\",\n",
|
||||||
|
" \" so we also need the `!important` here to be able to override the\\n\",\n",
|
||||||
|
" \" default hidden behavior on the sphinx rendered scikit-learn.org.\\n\",\n",
|
||||||
|
" \" See: https://github.com/scikit-learn/scikit-learn/issues/21755 */\\n\",\n",
|
||||||
|
" \" display: inline-block !important;\\n\",\n",
|
||||||
|
" \" position: relative;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-text-repr-fallback {\\n\",\n",
|
||||||
|
" \" display: none;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"div.sk-parallel-item,\\n\",\n",
|
||||||
|
" \"div.sk-serial,\\n\",\n",
|
||||||
|
" \"div.sk-item {\\n\",\n",
|
||||||
|
" \" /* draw centered vertical line to link estimators */\\n\",\n",
|
||||||
|
" \" background-image: linear-gradient(var(--sklearn-color-text-on-default-background), var(--sklearn-color-text-on-default-background));\\n\",\n",
|
||||||
|
" \" background-size: 2px 100%;\\n\",\n",
|
||||||
|
" \" background-repeat: no-repeat;\\n\",\n",
|
||||||
|
" \" background-position: center center;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Parallel-specific style estimator block */\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-parallel-item::after {\\n\",\n",
|
||||||
|
" \" content: \\\"\\\";\\n\",\n",
|
||||||
|
" \" width: 100%;\\n\",\n",
|
||||||
|
" \" border-bottom: 2px solid var(--sklearn-color-text-on-default-background);\\n\",\n",
|
||||||
|
" \" flex-grow: 1;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-parallel {\\n\",\n",
|
||||||
|
" \" display: flex;\\n\",\n",
|
||||||
|
" \" align-items: stretch;\\n\",\n",
|
||||||
|
" \" justify-content: center;\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-background);\\n\",\n",
|
||||||
|
" \" position: relative;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-parallel-item {\\n\",\n",
|
||||||
|
" \" display: flex;\\n\",\n",
|
||||||
|
" \" flex-direction: column;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-parallel-item:first-child::after {\\n\",\n",
|
||||||
|
" \" align-self: flex-end;\\n\",\n",
|
||||||
|
" \" width: 50%;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-parallel-item:last-child::after {\\n\",\n",
|
||||||
|
" \" align-self: flex-start;\\n\",\n",
|
||||||
|
" \" width: 50%;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-parallel-item:only-child::after {\\n\",\n",
|
||||||
|
" \" width: 0;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Serial-specific style estimator block */\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-serial {\\n\",\n",
|
||||||
|
" \" display: flex;\\n\",\n",
|
||||||
|
" \" flex-direction: column;\\n\",\n",
|
||||||
|
" \" align-items: center;\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-background);\\n\",\n",
|
||||||
|
" \" padding-right: 1em;\\n\",\n",
|
||||||
|
" \" padding-left: 1em;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Toggleable style: style used for estimator/Pipeline/ColumnTransformer box that is\\n\",\n",
|
||||||
|
" \"clickable and can be expanded/collapsed.\\n\",\n",
|
||||||
|
" \"- Pipeline and ColumnTransformer use this feature and define the default style\\n\",\n",
|
||||||
|
" \"- Estimators will overwrite some part of the style using the `sk-estimator` class\\n\",\n",
|
||||||
|
" \"*/\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Pipeline and ColumnTransformer style (default) */\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-toggleable {\\n\",\n",
|
||||||
|
" \" /* Default theme specific background. It is overwritten whether we have a\\n\",\n",
|
||||||
|
" \" specific estimator or a Pipeline/ColumnTransformer */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-background);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Toggleable label */\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 label.sk-toggleable__label {\\n\",\n",
|
||||||
|
" \" cursor: pointer;\\n\",\n",
|
||||||
|
" \" display: flex;\\n\",\n",
|
||||||
|
" \" width: 100%;\\n\",\n",
|
||||||
|
" \" margin-bottom: 0;\\n\",\n",
|
||||||
|
" \" padding: 0.5em;\\n\",\n",
|
||||||
|
" \" box-sizing: border-box;\\n\",\n",
|
||||||
|
" \" text-align: center;\\n\",\n",
|
||||||
|
" \" align-items: start;\\n\",\n",
|
||||||
|
" \" justify-content: space-between;\\n\",\n",
|
||||||
|
" \" gap: 0.5em;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 label.sk-toggleable__label .caption {\\n\",\n",
|
||||||
|
" \" font-size: 0.6rem;\\n\",\n",
|
||||||
|
" \" font-weight: lighter;\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-text-muted);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 label.sk-toggleable__label-arrow:before {\\n\",\n",
|
||||||
|
" \" /* Arrow on the left of the label */\\n\",\n",
|
||||||
|
" \" content: \\\"▸\\\";\\n\",\n",
|
||||||
|
" \" float: left;\\n\",\n",
|
||||||
|
" \" margin-right: 0.25em;\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-icon);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 label.sk-toggleable__label-arrow:hover:before {\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-text);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Toggleable content - dropdown */\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-toggleable__content {\\n\",\n",
|
||||||
|
" \" max-height: 0;\\n\",\n",
|
||||||
|
" \" max-width: 0;\\n\",\n",
|
||||||
|
" \" overflow: hidden;\\n\",\n",
|
||||||
|
" \" text-align: left;\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-unfitted-level-0);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-toggleable__content.fitted {\\n\",\n",
|
||||||
|
" \" /* fitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-fitted-level-0);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-toggleable__content pre {\\n\",\n",
|
||||||
|
" \" margin: 0.2em;\\n\",\n",
|
||||||
|
" \" border-radius: 0.25em;\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-text);\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-unfitted-level-0);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-toggleable__content.fitted pre {\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-fitted-level-0);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 input.sk-toggleable__control:checked~div.sk-toggleable__content {\\n\",\n",
|
||||||
|
" \" /* Expand drop-down */\\n\",\n",
|
||||||
|
" \" max-height: 200px;\\n\",\n",
|
||||||
|
" \" max-width: 100%;\\n\",\n",
|
||||||
|
" \" overflow: auto;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 input.sk-toggleable__control:checked~label.sk-toggleable__label-arrow:before {\\n\",\n",
|
||||||
|
" \" content: \\\"▾\\\";\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Pipeline/ColumnTransformer-specific style */\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-label input.sk-toggleable__control:checked~label.sk-toggleable__label {\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-text);\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-unfitted-level-2);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-label.fitted input.sk-toggleable__control:checked~label.sk-toggleable__label {\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-fitted-level-2);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Estimator-specific style */\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Colorize estimator box */\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-estimator input.sk-toggleable__control:checked~label.sk-toggleable__label {\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-unfitted-level-2);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-estimator.fitted input.sk-toggleable__control:checked~label.sk-toggleable__label {\\n\",\n",
|
||||||
|
" \" /* fitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-fitted-level-2);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-label label.sk-toggleable__label,\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-label label {\\n\",\n",
|
||||||
|
" \" /* The background is the default theme color */\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-text-on-default-background);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* On hover, darken the color of the background */\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-label:hover label.sk-toggleable__label {\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-text);\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-unfitted-level-2);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Label box, darken color on hover, fitted */\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-label.fitted:hover label.sk-toggleable__label.fitted {\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-text);\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-fitted-level-2);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Estimator label */\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-label label {\\n\",\n",
|
||||||
|
" \" font-family: monospace;\\n\",\n",
|
||||||
|
" \" font-weight: bold;\\n\",\n",
|
||||||
|
" \" display: inline-block;\\n\",\n",
|
||||||
|
" \" line-height: 1.2em;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-label-container {\\n\",\n",
|
||||||
|
" \" text-align: center;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Estimator-specific */\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-estimator {\\n\",\n",
|
||||||
|
" \" font-family: monospace;\\n\",\n",
|
||||||
|
" \" border: 1px dotted var(--sklearn-color-border-box);\\n\",\n",
|
||||||
|
" \" border-radius: 0.25em;\\n\",\n",
|
||||||
|
" \" box-sizing: border-box;\\n\",\n",
|
||||||
|
" \" margin-bottom: 0.5em;\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-unfitted-level-0);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-estimator.fitted {\\n\",\n",
|
||||||
|
" \" /* fitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-fitted-level-0);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* on hover */\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-estimator:hover {\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-unfitted-level-2);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 div.sk-estimator.fitted:hover {\\n\",\n",
|
||||||
|
" \" /* fitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-fitted-level-2);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Specification for estimator info (e.g. \\\"i\\\" and \\\"?\\\") */\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Common style for \\\"i\\\" and \\\"?\\\" */\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \".sk-estimator-doc-link,\\n\",\n",
|
||||||
|
" \"a:link.sk-estimator-doc-link,\\n\",\n",
|
||||||
|
" \"a:visited.sk-estimator-doc-link {\\n\",\n",
|
||||||
|
" \" float: right;\\n\",\n",
|
||||||
|
" \" font-size: smaller;\\n\",\n",
|
||||||
|
" \" line-height: 1em;\\n\",\n",
|
||||||
|
" \" font-family: monospace;\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-background);\\n\",\n",
|
||||||
|
" \" border-radius: 1em;\\n\",\n",
|
||||||
|
" \" height: 1em;\\n\",\n",
|
||||||
|
" \" width: 1em;\\n\",\n",
|
||||||
|
" \" text-decoration: none !important;\\n\",\n",
|
||||||
|
" \" margin-left: 0.5em;\\n\",\n",
|
||||||
|
" \" text-align: center;\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" border: var(--sklearn-color-unfitted-level-1) 1pt solid;\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-unfitted-level-1);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \".sk-estimator-doc-link.fitted,\\n\",\n",
|
||||||
|
" \"a:link.sk-estimator-doc-link.fitted,\\n\",\n",
|
||||||
|
" \"a:visited.sk-estimator-doc-link.fitted {\\n\",\n",
|
||||||
|
" \" /* fitted */\\n\",\n",
|
||||||
|
" \" border: var(--sklearn-color-fitted-level-1) 1pt solid;\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-fitted-level-1);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* On hover */\\n\",\n",
|
||||||
|
" \"div.sk-estimator:hover .sk-estimator-doc-link:hover,\\n\",\n",
|
||||||
|
" \".sk-estimator-doc-link:hover,\\n\",\n",
|
||||||
|
" \"div.sk-label-container:hover .sk-estimator-doc-link:hover,\\n\",\n",
|
||||||
|
" \".sk-estimator-doc-link:hover {\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-unfitted-level-3);\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-background);\\n\",\n",
|
||||||
|
" \" text-decoration: none;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"div.sk-estimator.fitted:hover .sk-estimator-doc-link.fitted:hover,\\n\",\n",
|
||||||
|
" \".sk-estimator-doc-link.fitted:hover,\\n\",\n",
|
||||||
|
" \"div.sk-label-container:hover .sk-estimator-doc-link.fitted:hover,\\n\",\n",
|
||||||
|
" \".sk-estimator-doc-link.fitted:hover {\\n\",\n",
|
||||||
|
" \" /* fitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-fitted-level-3);\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-background);\\n\",\n",
|
||||||
|
" \" text-decoration: none;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* Span, style for the box shown on hovering the info icon */\\n\",\n",
|
||||||
|
" \".sk-estimator-doc-link span {\\n\",\n",
|
||||||
|
" \" display: none;\\n\",\n",
|
||||||
|
" \" z-index: 9999;\\n\",\n",
|
||||||
|
" \" position: relative;\\n\",\n",
|
||||||
|
" \" font-weight: normal;\\n\",\n",
|
||||||
|
" \" right: .2ex;\\n\",\n",
|
||||||
|
" \" padding: .5ex;\\n\",\n",
|
||||||
|
" \" margin: .5ex;\\n\",\n",
|
||||||
|
" \" width: min-content;\\n\",\n",
|
||||||
|
" \" min-width: 20ex;\\n\",\n",
|
||||||
|
" \" max-width: 50ex;\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-text);\\n\",\n",
|
||||||
|
" \" box-shadow: 2pt 2pt 4pt #999;\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" background: var(--sklearn-color-unfitted-level-0);\\n\",\n",
|
||||||
|
" \" border: .5pt solid var(--sklearn-color-unfitted-level-3);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \".sk-estimator-doc-link.fitted span {\\n\",\n",
|
||||||
|
" \" /* fitted */\\n\",\n",
|
||||||
|
" \" background: var(--sklearn-color-fitted-level-0);\\n\",\n",
|
||||||
|
" \" border: var(--sklearn-color-fitted-level-3);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \".sk-estimator-doc-link:hover span {\\n\",\n",
|
||||||
|
" \" display: block;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* \\\"?\\\"-specific style due to the `<a>` HTML tag */\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 a.estimator_doc_link {\\n\",\n",
|
||||||
|
" \" float: right;\\n\",\n",
|
||||||
|
" \" font-size: 1rem;\\n\",\n",
|
||||||
|
" \" line-height: 1em;\\n\",\n",
|
||||||
|
" \" font-family: monospace;\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-background);\\n\",\n",
|
||||||
|
" \" border-radius: 1rem;\\n\",\n",
|
||||||
|
" \" height: 1rem;\\n\",\n",
|
||||||
|
" \" width: 1rem;\\n\",\n",
|
||||||
|
" \" text-decoration: none;\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-unfitted-level-1);\\n\",\n",
|
||||||
|
" \" border: var(--sklearn-color-unfitted-level-1) 1pt solid;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 a.estimator_doc_link.fitted {\\n\",\n",
|
||||||
|
" \" /* fitted */\\n\",\n",
|
||||||
|
" \" border: var(--sklearn-color-fitted-level-1) 1pt solid;\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-fitted-level-1);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"/* On hover */\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 a.estimator_doc_link:hover {\\n\",\n",
|
||||||
|
" \" /* unfitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-unfitted-level-3);\\n\",\n",
|
||||||
|
" \" color: var(--sklearn-color-background);\\n\",\n",
|
||||||
|
" \" text-decoration: none;\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"#sk-container-id-1 a.estimator_doc_link.fitted:hover {\\n\",\n",
|
||||||
|
" \" /* fitted */\\n\",\n",
|
||||||
|
" \" background-color: var(--sklearn-color-fitted-level-3);\\n\",\n",
|
||||||
|
" \"}\\n\",\n",
|
||||||
|
" \"</style><div id=\\\"sk-container-id-1\\\" class=\\\"sk-top-container\\\"><div class=\\\"sk-text-repr-fallback\\\"><pre>MultinomialNB()</pre><b>In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook. <br />On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.</b></div><div class=\\\"sk-container\\\" hidden><div class=\\\"sk-item\\\"><div class=\\\"sk-estimator fitted sk-toggleable\\\"><input class=\\\"sk-toggleable__control sk-hidden--visually\\\" id=\\\"sk-estimator-id-1\\\" type=\\\"checkbox\\\" checked><label for=\\\"sk-estimator-id-1\\\" class=\\\"sk-toggleable__label fitted sk-toggleable__label-arrow\\\"><div><div>MultinomialNB</div></div><div><a class=\\\"sk-estimator-doc-link fitted\\\" rel=\\\"noreferrer\\\" target=\\\"_blank\\\" href=\\\"https://scikit-learn.org/1.6/modules/generated/sklearn.naive_bayes.MultinomialNB.html\\\">?<span>Documentation for MultinomialNB</span></a><span class=\\\"sk-estimator-doc-link fitted\\\">i<span>Fitted</span></span></div></label><div class=\\\"sk-toggleable__content fitted\\\"><pre>MultinomialNB()</pre></div> </div></div></div></div>\"\n",
|
||||||
|
" ]\n",
|
||||||
|
" },\n",
|
||||||
|
" \"metadata\": {},\n",
|
||||||
|
" \"execution_count\": 15\n",
|
||||||
|
" }\n",
|
||||||
|
" ],\n",
|
||||||
|
" \"source\": [\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"# 5. MODEL KLASIFIKASI\\n\",\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"model = MultinomialNB()\\n\",\n",
|
||||||
|
" \"model.fit(X, labels)\"\n",
|
||||||
|
" ]\n",
|
||||||
|
" },\n",
|
||||||
|
" {\n",
|
||||||
|
" \"cell_type\": \"code\",\n",
|
||||||
|
" \"execution_count\": 16,\n",
|
||||||
|
" \"metadata\": {\n",
|
||||||
|
" \"id\": \"ShevCTva2Fg9\",\n",
|
||||||
|
" \"colab\": {\n",
|
||||||
|
" \"base_uri\": \"https://localhost:8080/\"\n",
|
||||||
|
" },\n",
|
||||||
|
" \"outputId\": \"228e8f03-bcfb-4ecc-c36f-d86402530a5b\"\n",
|
||||||
|
" },\n",
|
||||||
|
" \"outputs\": [\n",
|
||||||
|
" {\n",
|
||||||
|
" \"output_type\": \"stream\",\n",
|
||||||
|
" \"name\": \"stdout\",\n",
|
||||||
|
" \"text\": [\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"Kalimat uji : saya suka belajar python\\n\",\n",
|
||||||
|
" \"Hasil klasifikasi : positif\\n\"\n",
|
||||||
|
" ]\n",
|
||||||
|
" }\n",
|
||||||
|
" ],\n",
|
||||||
|
" \"source\": [\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"# 6. PREDIKSI DATA BARU\\n\",\n",
|
||||||
|
" \"# =========================\\n\",\n",
|
||||||
|
" \"test_sentence = [\\\"saya suka belajar python\\\"]\\n\",\n",
|
||||||
|
" \"test_sentence = [clean_text(test_sentence[0])]\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"X_test = vectorizer.transform(test_sentence)\\n\",\n",
|
||||||
|
" \"prediction = model.predict(X_test)\\n\",\n",
|
||||||
|
" \"\\n\",\n",
|
||||||
|
" \"print(\\\"\\\\nKalimat uji :\\\", test_sentence[0])\\n\",\n",
|
||||||
|
" \"print(\\\"Hasil klasifikasi :\\\", prediction[0])\"\n",
|
||||||
|
" ]\n",
|
||||||
|
" },\n",
|
||||||
|
" {\n",
|
||||||
|
" \"cell_type\": \"code\",\n",
|
||||||
|
" \"execution_count\": 16,\n",
|
||||||
|
" \"metadata\": {\n",
|
||||||
|
" \"id\": \"NQjExannHuj0\"\n",
|
||||||
|
" },\n",
|
||||||
|
" \"outputs\": [],\n",
|
||||||
|
" \"source\": []\n",
|
||||||
|
" }\n",
|
||||||
|
" ],\n",
|
||||||
|
" \"metadata\": {\n",
|
||||||
|
" \"colab\": {\n",
|
||||||
|
" \"provenance\": []\n",
|
||||||
|
" },\n",
|
||||||
|
" \"kernelspec\": {\n",
|
||||||
|
" \"display_name\": \"Python 3 (ipykernel)\",\n",
|
||||||
|
" \"language\": \"python\",\n",
|
||||||
|
" \"name\": \"python3\"\n",
|
||||||
|
" },\n",
|
||||||
|
" \"language_info\": {\n",
|
||||||
|
" \"codemirror_mode\": {\n",
|
||||||
|
" \"name\": \"ipython\",\n",
|
||||||
|
" \"version\": 3\n",
|
||||||
|
" },\n",
|
||||||
|
" \"file_extension\": \".py\",\n",
|
||||||
|
" \"mimetype\": \"text/x-python\",\n",
|
||||||
|
" \"name\": \"python\",\n",
|
||||||
|
" \"nbconvert_exporter\": \"python\",\n",
|
||||||
|
" \"pygments_lexer\": \"ipython3\",\n",
|
||||||
|
" \"version\": \"3.12.2\"\n",
|
||||||
|
" }\n",
|
||||||
|
" },\n",
|
||||||
|
" \"nbformat\": 4,\n",
|
||||||
|
" \"nbformat_minor\": 0\n",
|
||||||
|
"}"
|
||||||
|
]
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
Loading…
x
Reference in New Issue
Block a user