Hack, Learn, Secure: Your Cybersecurity Playground

Home

AI Analyser2

Example – Email Spam Detection

TASK 2: Model Steps – Spam Classification using Logistic Regression


          sudo apt install -y python3-pandas

          sudo apt install -y python3-numpy

          import numpy as np

          import pandas as pd
          
        

          sudo apt install -y python3-sklearn

          from sklearn.feature_extraction.text import CountVectorizer

          from sklearn.model_selection import train_test_split

          from sklearn.linear_model import LogisticRegression
          
        

          # Download the labelled messages; the code below relies on 'text' and 'target' columns.
          dataset_url = 'https://raw.githubusercontent.com/AiDevNepal/ai-saturdays-workshop-8/master/data/spam.csv'
          data = pd.read_csv(dataset_url)

          # Encode the label numerically: 1 where the label equals 'spam', 0 for everything else.
          is_spam = data['target'] == 'spam'
          data['target'] = np.where(is_spam, 1, 0)
          
        

          # Split messages and labels into training and test subsets;
          # random_state=0 fixes the shuffle so the split is the same on every run.
          X_train, X_test, Y_train, Y_test = train_test_split(
              data['text'], data['target'], random_state=0
          )

          # Build the token-count vocabulary from the training messages only,
          # then apply that same vocabulary to the test messages.
          # (Indentation here is spaces only: mixing tabs and spaces makes
          # Python reject the snippet with an indentation error.)
          vectorizer = CountVectorizer()
          X_train_vectorized = vectorizer.fit_transform(X_train)
          X_test_vectorized = vectorizer.transform(X_test)
          
        

          # Create the classifier with an explicit cap of 1000 solver iterations and
          # train it on the vectorized training messages; fit() returns the fitted
          # estimator, so `model` is ready for prediction afterwards.
          model = LogisticRegression(max_iter=1000).fit(X_train_vectorized, Y_train)