
Logistic Regression with Pytorch

Alright, everyone. Let's go ahead and start doing things. We will start with a brief review, so that we are all on the same page.

Review: Logistic Regression with Scikit-Learn

If you have reached this point, you probably know by heart how to define a Logistic Regression pipeline in Scikit-Learn:

In [17]:
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.linear_model import LogisticRegression
from sklearn.pipeline import Pipeline

vectorizer = CountVectorizer(binary=True)
classifier = LogisticRegression()
pipeline = Pipeline([("vectorizer", vectorizer),
                     ("classifier", classifier)])

Remember that when we call pipeline.fit(), we first fit the vectorizer and then, with the results, we fit the classifier. So, these two methods for training our model are absolutely equivalent:

In [18]:
def train_the_pipeline(pipeline, X_train, y_train):
    pipeline.fit(X_train, y_train)
    return pipeline

def train_each_part_separately(vectorizer, classifier, X_train, y_train):
    X_train_vectorized = vectorizer.fit_transform(X_train)
    classifier.fit(X_train_vectorized, y_train)
    return vectorizer, classifier

In fact, let's go ahead and train our model now, so that the next steps in this lesson go a bit more smoothly. We will fit it to classify some texts from our usual dataset:

In [19]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score

df = pd.read_csv('https://raw.githubusercontent.com/tiagoft/NLP/refs/heads/main/wiki_movie_plots_drama_comedy.csv').sample(1000)
X_train, X_test, y_train, y_test = train_test_split(df['Plot'], df['Genre'], test_size=0.2, random_state=42)
vectorizer, classifier = train_each_part_separately(vectorizer, classifier, X_train, y_train)
X_vect = vectorizer.transform(X_test)
y_pred = classifier.predict(X_vect)
print(accuracy_score(y_test, y_pred))
0.71

Now, let's recall how Logistic Regression works!

The fitted predictor expects an input with $d$ features.

We use the vectorizer to map each text in X_test to a vector with $d$ elements. Each of these vectors is a row $[x_1, x_2, x_3, \cdots, x_d]$ in X_vect (note that the index $d$ in $x_d$ is the same as the number of features expected by the fitted predictor).

Then, Logistic Regression uses its fitted weights $\beta$ to calculate a weighted sum of the elements in the input, that is:

$$ z = \beta_0 + x_1 \beta_1 + x_2 \beta_2 + \cdots + x_d \beta_d. $$

Note that if we have a matrix made of $N$ rows of features (each row corresponding to a dataset item!), then we can calculate the output for each row $i$ using:

$$ z_i = \beta_0 + x_{i,1} \beta_1 + x_{i,2} \beta_2 + \cdots + x_{i,d} \beta_d. $$

This can be translated into a matrix multiplication:

$$ \begin{bmatrix} z_1 \\ z_2 \\ \cdots \\ z_N \end{bmatrix} = \beta_0 + \begin{bmatrix} x_{1,1} & x_{1,2} & \cdots & x_{1,d} \\ x_{2,1} & x_{2,2} & \cdots & x_{2,d} \\ \cdots & \cdots & \cdots & \cdots \\ x_{N,1} & x_{N,2} & \cdots & x_{N,d} \\ \end{bmatrix} \begin{bmatrix} \beta_1 \\ \beta_2 \\ \cdots \\ \beta_d \end{bmatrix}. $$

We can simplify this by defining a weight matrix $w = [\beta_1, \beta_2, \cdots, \beta_d]$, and an input matrix $X$ containing all elements $x_{i,j}$ so that:

$$ z = \beta_0 + X w^T $$

Last, we apply the logistic function to each element of the vector $z$, and then we have a prediction.

The elements of $z$ are called logits, $\beta_0$ is called the bias, and the elements of $w$ are called the weights.
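
To make this concrete, here is a minimal sketch (not part of the original notebook) that reproduces these steps by hand, using the vectorizer and classifier fitted above; scipy's expit is the logistic function:

import numpy as np
from scipy.special import expit   # expit is the logistic (sigmoid) function

w = classifier.coef_              # shape (1, d): the weights beta_1 ... beta_d
beta_0 = classifier.intercept_    # shape (1,): the bias beta_0

X_small = X_vect[:5].toarray()    # a few rows of the vectorized test set (N x d)
z = beta_0 + X_small @ w.T        # logits, shape (N, 1)
p = expit(z)                      # P(C | x) for each row

# This should match the second column of predict_proba for the same rows:
print(np.allclose(p.ravel(), classifier.predict_proba(X_small)[:, 1]))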

Good, but we didn't come this far just to hear about Logistic Regression again. Let's now proceed!

Our first model with Pytorch

If you haven't done so yet, this is the moment to pip install torch. Pytorch is a framework that provides an API similar to Numpy, with the addition of allowing operations on the GPU and easy access to autograd (automatic differentiation). It also contains many classes that are very useful for Machine Learning applications. For example:

In [20]:
import torch.nn as nn
linear_layer = nn.Linear(in_features=3, out_features=1)
print(linear_layer)
Linear(in_features=3, out_features=1, bias=True)

A linear layer takes an input $X$, multiplies it by a weight matrix $w$, and adds a bias $b$. In other words:

$$ z = \beta_0 + X w^T $$

Sounds familiar? Let's see this operation working in practice:

In [21]:
import torch
X = torch.tensor([[1.0, 2.0, 3.0], [4.0, 5.0, 6.0]])

# We can call the linear_layer, and it will perform its operation:
output = linear_layer(X)
print(output)

# We can also access the weights and biases of the linear layer:
w = linear_layer.weight
b = linear_layer.bias
print(w, b)

# We can use these weights and biases to perform the operation manually:
z = X @ w.T + b
print(z)
tensor([[-0.8340],
        [-0.7707]], grad_fn=<AddmmBackward0>)
Parameter containing:
tensor([[ 0.4499, -0.2000, -0.2288]], requires_grad=True) Parameter containing:
tensor([-0.1976], requires_grad=True)
tensor([[-0.8340],
        [-0.7707]], grad_fn=<AddBackward0>)

Note that we defined the size of the weight matrix using the in_features and out_features of our linear layer. The number in_features is the dimension of the input (our $d$), and out_features allows us to calculate several outputs $z_j$ simultaneously and independently. For example, having in_features=$d$ and out_features=3 leads to:

$$ \begin{bmatrix} z_{1,1} & z_{1,2} & z_{1,3} \\ z_{2,1} & z_{2,2} & z_{2,3} \\ \cdots & \cdots & \cdots \\ z_{N,1} & z_{N,2} & z_{N,3} \end{bmatrix} = \beta_0 + \begin{bmatrix} x_{1,1} & x_{1,2} & \cdots & x_{1,d} \\ x_{2,1} & x_{2,2} & \cdots & x_{2,d} \\ \cdots & \cdots & \cdots & \cdots \\ x_{N,1} & x_{N,2} & \cdots & x_{N,d} \\ \end{bmatrix} \begin{bmatrix} \beta_{1,1} & \beta_{1,2} & \beta_{1,3}\\ \beta_{2,1} & \beta_{2,2} & \beta_{2,3}\\ \cdots & \cdots & \cdots \\ \beta_{d,1} & \beta_{d,2} & \beta_{d,3} \end{bmatrix}. $$

or, more compactly:

$$ z_{N \times j} = X_{N \times d} w^T_{d \times j} + b_{1 \times j} $$

Note that $w \in \mathbb{R}^{j \times d}$, hence $w^T \in \mathbb{R}^{d \times j}$.
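
As a quick sanity check of these shapes, here is a small sketch (arbitrary sizes, not part of the course code):

# A linear layer with out_features=3 keeps one weight vector per output:
# weight has shape (3, d) and bias has shape (3,)
layer = nn.Linear(in_features=4, out_features=3)   # d=4 and j=3, chosen arbitrarily
X_demo = torch.randn(5, 4)                         # N=5 rows with d=4 features each
Z = layer(X_demo)                                  # shape (5, 3): one z_j per output, per row
print(layer.weight.shape, layer.bias.shape, Z.shape)
# torch.Size([3, 4]) torch.Size([3]) torch.Size([5, 3])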

Exercise 1

In the formulation for the linear layer above, $z$ corresponds to an important part of a logistic regression (remember: logistic regression has an input, a decision function, and then a final probability estimate $P(C | x)$). Which of these parts corresponds to the linear layer operation, and what is missing to make a full logistic regression using the linear layer?

A linear layer is a linear predictor?

Alright, so the linear layer works essentially the same way as logistic regression. Let's show it!

First, go back to the classifier we made at the beginning of this class. If you haven't fitted it yet, do it now.

In the code below, we get the weights from the fitted logistic regression and substitute them in our linear layer:

In [23]:
logistic_w = classifier.coef_
logistic_b = classifier.intercept_

w = torch.tensor(logistic_w, dtype=torch.float32)
b = torch.tensor(logistic_b, dtype=torch.float32)

linear_layer.weight.data = w
linear_layer.bias.data = b

Now, we can run the linear layer with X_vect and then apply a logistic function:

In [24]:
X_vect_tensor = torch.tensor(X_vect.toarray(), dtype=torch.float32)
output = linear_layer(X_vect_tensor)
output_probs = torch.sigmoid(output)

Note that our output_probs here is equal to the second column of the output of classifier.predict_proba():

In [25]:
y_probs = classifier.predict_proba(X_vect)
print(y_probs[:5])
print(output_probs[:5])
[[0.00112143 0.99887857]
 [0.52950462 0.47049538]
 [0.01416174 0.98583826]
 [0.07480901 0.92519099]
 [0.65259003 0.34740997]]
tensor([[0.9989],
        [0.4705],
        [0.9858],
        [0.9252],
        [0.3474]], grad_fn=<SliceBackward0>)

In fact, we could simply decide our class by thresholding our output:

In [26]:
binary_out = (output_probs > 0.5).numpy().astype(int)
binary_y = (y_test==classifier.classes_[1]).astype(int)
print(accuracy_score(binary_y, binary_out))
0.71

How to train a Logistic Regression

Remember that our classifier outputs:

$$ \hat{y} = \sigma(z) = \sigma(Xw^T + b), $$ where $\sigma()$ denotes the sigmoid (or logistic) function?

The procedure to adjust the weights and biases in our linear layer is to use actual examples of outputs ($y$) and compare them to our estimate $\hat{y}$. They are probably not going to be the same, so we can measure how different $y$ and $\hat{y}$ are using a loss function $L(y, \hat{y})$. Then, we are going to calculate the derivative of $L$ with respect to all weights and biases, that is, we will have:

$$ g_i = \frac{\partial L}{\partial p_i} $$

for each parameter $p_i$ in the linear layer (either a weight or a bias).

You might have noticed that $g$ is a vector of derivatives. Actually, you might even remember that it is called the gradient vector, written $\nabla L$.

Remember that the gradient points in the direction in which $L$ grows the most if we change the parameters $p$? So, let's do the opposite! We want to decrease our loss, so we will change our parameters by subtracting a little bit of the gradient vector, that is, we iteratively update the parameters as:

$$ p_i \leftarrow p_i - \alpha \frac{\partial L}{\partial p_i}, $$

where $\alpha$ is a small value of our choice. A lower $\alpha$ means steps will be smaller, which can make it take longer to converge, whereas a higher value can lead to instabilities.

We could be fancier and write this in vector form:

$$ p \leftarrow p - \alpha \nabla_{\mathbf{p}} L. $$

What we usually do is calculate the gradient $g$ for each item in the training data, and then sum (or average?) it before applying the step to the parameters. This process of going through the whole dataset once is called an epoch.
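
Before we use Pytorch's built-in machinery, here is a minimal sketch (with toy numbers, not our real model) of a single gradient-descent step done by hand with autograd:

# Two toy parameters and a made-up loss, just to see the update rule in action
p = torch.tensor([1.0, -2.0], requires_grad=True)
L = torch.sum((p - torch.tensor([0.5, 0.5]))**2)   # a toy loss
L.backward()                                       # autograd fills p.grad with dL/dp
alpha = 0.1
with torch.no_grad():                              # the update itself should not be tracked
    p -= alpha * p.grad                            # p <- p - alpha * gradient
print(p)                                           # both parameters moved a bit towards 0.5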

Now, how do we implement this? Let's go!

In [27]:
# First, we prepare our data:
X_vect_train = torch.tensor(vectorizer.transform(X_train).toarray(), dtype=torch.float32)
y_train_ = (y_train == classifier.classes_[1]).astype(int).values
y_train_vect = torch.tensor( y_train_, dtype=torch.float32).reshape( -1, 1)

Ok, now we are going to get into an optimization loop. When using Pytorch, we must first define an optimizer - we will use SGD, which is literally the gradient descent algorithm we have seen so far. Then, we will go into a training loop consisting of:

  1. Zero the gradients in the optimizer to reset its state,
  2. Calculate the output of the classifier,
  3. Calculate the loss for that output,
  4. Calculate the gradient of the loss (propagating back through the layer!) using autograd,
  5. Apply the gradient step to our parameters.

It goes like this:

In [28]:
# Let's start with a new linear layer:
clf = nn.Linear(in_features=len(vectorizer.vocabulary_), out_features=1)

# We will also define an optimizer:
optimizer = torch.optim.SGD(clf.parameters(), lr=1e-4) # lr is the learning rate - this is our alpha

print("Entering loop")
# And now, this is the training loop:
for epoch in range(5):
    optimizer.zero_grad()
    output = clf(X_vect_train)
    output_probs = torch.sigmoid(output)
    loss = torch.sum( (output_probs-y_train_vect)**2 )
    loss.backward()
    optimizer.step()
    print(loss.item())
Entering loop
201.01898193359375
197.97332763671875
195.9878387451172
194.46324157714844
193.14129638671875

How does Pytorch know that gradients should be calculated? Well, they are tracked by default. That is why, at inference (or test) time, we use torch.no_grad() and model.eval() - this saves both memory and computation time:

In [29]:
X_vect_test = torch.tensor(vectorizer.transform(X_test).toarray(), dtype=torch.float32)
y_test_ = (y_test == classifier.classes_[1]).astype(int).values
with torch.no_grad():
    clf.eval()
    y_pred = (torch.sigmoid(clf(X_vect_test)) > 0.5).numpy().astype(int)
print(accuracy_score(y_test_, y_pred))
0.585

Watching our training process

If you simply increased the number of epochs to 1000 in our loop, you were probably flooded with print statements showing the current loss. We don't want to see that - rather, we want a figure!

Up until a few years ago, we had to make this figure all by ourselves, with a procedure such as:

In [32]:
from tqdm import tqdm # This will make us a progress bar

clf = nn.Linear(in_features=len(vectorizer.vocabulary_), out_features=1)
optimizer = torch.optim.SGD(clf.parameters(), lr=1e-4) # lr is the learning rate - this is our alpha

# And now, the same training loop as before, but storing each loss:
losses = []
for epoch in tqdm(range(100)):
    optimizer.zero_grad()
    output = clf(X_vect_train)
    output_probs = torch.sigmoid(output)
    loss = torch.sum( (output_probs-y_train_vect)**2 )
    loss.backward()
    optimizer.step()
    losses.append(loss.item())
100%|██████████| 100/100 [00:00<00:00, 182.95it/s]
In [34]:
import matplotlib.pyplot as plt
plt.figure(figsize=(3,2))
plt.plot(losses)
plt.xlabel('Epoch')
plt.ylabel('Loss')
plt.show()
[Figure: training loss per epoch]

Nowadays, we have plenty of frameworks for tracking this kind of data: Weights and Biases, MLFlow, TensorBoard, and so on. Please, do feel free to use any of them. We will not adopt one for this course, because we might get trapped in framework-specific details.

The main lessons here are:

  • Save your losses to a variable, and plot figures later (do NOT plot during training!)
  • Do not rely on printing to the terminal to debug your loss
  • Use tqdm so we know your code is running.

Exercise 2

Manipulate the code above to answer the following:

  1. When we use torch.sum( (output_probs-y_train_vect)**2 ) to calculate the loss, we are essentially saying that larger datasets have larger losses. Change this calculation so the loss is independent of the number of items in the dataset.
  2. You might want to increase the learning rate lr to make your training faster. What happens if you increase it too much? Can you guess why?
  3. Change your code to show that the accuracy (at least in the training set) tends to increase as the loss decreases.
  4. How many epochs do you actually need in this training process?
