IyBJbXBvcnRpbmcgbmVjZXNzYXJ5IGxpYnJhcmllcwppbXBvcnQgcGFuZGFzIGFzIHBkCmZyb20gc2tsZWFybi5mZWF0dXJlX2V4dHJhY3Rpb24udGV4dCBpbXBvcnQgVGZpZGZWZWN0b3JpemVyCmZyb20gc2tsZWFybi5tb2RlbF9zZWxlY3Rpb24gaW1wb3J0IHRyYWluX3Rlc3Rfc3BsaXQKZnJvbSBza2xlYXJuLmxpbmVhcl9tb2RlbCBpbXBvcnQgTG9naXN0aWNSZWdyZXNzaW9uCmZyb20gc2tsZWFybi5tZXRyaWNzIGltcG9ydCBhY2N1cmFjeV9zY29yZQoKIyBTYW1wbGUgZGF0YXNldCAocmVwbGFjZSB3aXRoIHlvdXIgZGF0YXNldCkKZGF0YSA9IHBkLkRhdGFGcmFtZSh7CiAgICAndGV4dCc6IFsmcXVvdDtJIGxvdmUgdGhpcyBtb3ZpZSEmcXVvdDssICZxdW90O1RoaXMgbW92aWUgaXMgdGVycmlibGUuJnF1b3Q7LCAmcXVvdDtOZXV0cmFsIHR3ZWV0IGFib3V0IHNvbWV0aGluZy4mcXVvdDtdLAogICAgJ3NlbnRpbWVudCc6IFsncG9zaXRpdmUnLCAnbmVnYXRpdmUnLCAnbmV1dHJhbCddCn0pCgojIFNwbGl0IGRhdGEgaW50byBmZWF0dXJlcyAoWCkgYW5kIHRhcmdldCAoeSkKWCA9IGRhdGFbJ3RleHQnXQp5ID0gZGF0YVsnc2VudGltZW50J10KCiMgVmVjdG9yaXplIHRleHQgZGF0YSB1c2luZyBURi1JREYgcmVwcmVzZW50YXRpb24KdmVjdG9yaXplciA9IFRmaWRmVmVjdG9yaXplcigpClhfdmVjdCA9IHZlY3Rvcml6ZXIuZml0X3RyYW5zZm9ybShYKQoKIyBTcGxpdCBkYXRhIGludG8gdHJhaW5pbmcgYW5kIHRlc3Rpbmcgc2V0cwpYX3RyYWluLCBYX3Rlc3QsIHlfdHJhaW4sIHlfdGVzdCA9IHRyYWluX3Rlc3Rfc3BsaXQoWF92ZWN0LCB5LCB0ZXN0X3NpemU9MC4yLCByYW5kb21fc3RhdGU9NDIpCgojIEJ1aWxkIGFuZCB0cmFpbiBMb2dpc3RpYyBSZWdyZXNzaW9uIG1vZGVsCm1vZGVsID0gTG9naXN0aWNSZWdyZXNzaW9uKCkKbW9kZWwuZml0KFhfdHJhaW4sIHlfdHJhaW4pCgojIEV2YWx1YXRlIG1vZGVsCnlfcHJlZCA9IG1vZGVsLnByZWRpY3QoWF90ZXN0KQphY2N1cmFjeSA9IGFjY3VyYWN5X3Njb3JlKHlfdGVzdCwgeV9wcmVkKQoKcHJpbnQoJnF1b3Q7QWNjdXJhY3k6JnF1b3Q7LCBhY2N1cmFjeSkK
# Importing necessary libraries
import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score
# Sample dataset (replace with your dataset).
# NOTE: this toy frame has three rows and each sentiment label appears exactly
# once, so whichever row is held out carries a label the model never saw during
# training. The printed accuracy is therefore only a smoke test of the
# workflow, not a meaningful score.
data = pd.DataFrame({
    'text': [
        "I love this movie!",
        "This movie is terrible.",
        "Neutral tweet about something.",
    ],
    'sentiment': ['positive', 'negative', 'neutral'],
})

# Split data into features (X) and target (y)
X = data['text']
y = data['sentiment']

# Split the RAW text into training and testing sets before any feature
# extraction. Fitting TF-IDF on the full corpus would let test documents
# influence the vocabulary and IDF weights (train/test leakage).
X_train_text, X_test_text, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)

# Learn the TF-IDF vocabulary/weights from the training text only, then apply
# that same fitted transform to the held-out text. Terms that occur only in
# the test text are ignored by transform().
vectorizer = TfidfVectorizer()
X_train = vectorizer.fit_transform(X_train_text)
X_test = vectorizer.transform(X_test_text)

# Build and train Logistic Regression model
model = LogisticRegression()
model.fit(X_train, y_train)

# Evaluate model on the held-out split
y_pred = model.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)