In [2]:
from sklearn.preprocessing import LabelEncoder

# fit() hands back the encoder itself, so construction and fitting are chained.
le = LabelEncoder().fit([1, 2, 2, 6])

# A notebook cell only echoes its final expression: the two lines below are
# evaluated, but their results are not displayed.
le.classes_
le.transform([1, 1, 2, 6])

# Turn integer codes back into the original labels (this is the value shown).
le.inverse_transform([0, 0, 1, 2])

array([1, 1, 2, 6])

In [3]:
from sklearn.preprocessing import LabelEncoder

le = LabelEncoder()
print("LabelEncoder initialized.")

# Fitting records the distinct labels on the encoder as `classes_`.
le.fit([1, 2, 2, 6])
print("Fitted classes:", le.classes_)

# Labels -> integer codes.
encoded_values = le.transform([1, 1, 2, 6])
print("Transformed values:", encoded_values)

# Integer codes -> labels.
decoded_values = le.inverse_transform([0, 0, 1, 2])
print("Inverse transformed values:", decoded_values)

LabelEncoder initialized.
Fitted classes: [1 2 6]
Transformed values: [0 0 1 2]
Inverse transformed values: [1 1 2 6]


In [4]:
from sklearn.preprocessing import LabelEncoder
import pandas as pd

# Toy dataset: a text 'Fruit' column alongside a numeric 'Price' column.
fruit_names = ['Apple', 'Banana', 'Orange', 'Apple', 'Orange', 'Banana']
fruit_prices = [1.2, 0.5, 0.8, 1.3, 0.9, 0.6]

le = LabelEncoder()

# Build the frame and append the integer codes in one chained expression; the
# lambda receives the freshly built frame, so the encoder is fitted on its
# 'Fruit' column.
data = pd.DataFrame({'Fruit': fruit_names, 'Price': fruit_prices}).assign(
    Fruit_Encoded=lambda frame: le.fit_transform(frame['Fruit'])
)

print(data)
# The fitted labels, in the order of their integer codes.
print("Category Mapping:", le.classes_)


    Fruit  Price  Fruit_Encoded
0   Apple    1.2              0
1  Banana    0.5              1
2  Orange    0.8              2
3   Apple    1.3              0
4  Orange    0.9              2
5  Banana    0.6              1
Category Mapping: ['Apple' 'Banana' 'Orange']


In [5]:
# Convert the column to a pandas categorical once and reuse it for both the
# integer codes and the code -> label lookup.
fruit_categorical = data['Fruit'].astype('category')

data['Fruit_Encoded_Pandas'] = fruit_categorical.cat.codes
print(data)

code_to_label = dict(enumerate(fruit_categorical.cat.categories))
print("Category Mapping:", code_to_label)


    Fruit  Price  Fruit_Encoded  Fruit_Encoded_Pandas
0   Apple    1.2              0                     0
1  Banana    0.5              1                     1
2  Orange    0.8              2                     2
3   Apple    1.3              0                     0
4  Orange    0.9              2                     2
5  Banana    0.6              1                     1
Category Mapping: {0: 'Apple', 1: 'Banana', 2: 'Orange'}


In [6]:
# Explicit rank for every level so the codes follow Low < Medium < High.
satisfaction_order = {'Low': 0, 'Medium': 1, 'High': 2}

data = pd.DataFrame({
    'Satisfaction': ['Low', 'High', 'Medium', 'Low', 'High'],
    'Score': [3, 8, 5, 2, 9],
})

# Look each label up in the rank table and attach the result as a new column.
data = data.assign(
    Satisfaction_Encoded=lambda frame: frame['Satisfaction'].map(satisfaction_order)
)

print(data)


  Satisfaction  Score  Satisfaction_Encoded
0          Low      3                     0
1         High      8                     2
2       Medium      5                     1
3          Low      2                     0
4         High      9                     2


In [7]:
from sklearn.pipeline import Pipeline
from sklearn.preprocessing import OrdinalEncoder
from sklearn.tree import DecisionTreeClassifier

# Encode categorical *feature* columns, then fit a decision tree on the codes.
#
# LabelEncoder cannot be used as a pipeline step: it is meant for the target
# `y`, and its fit/transform methods accept a single argument, so
# `pipeline.fit(X, y)` would raise a TypeError. OrdinalEncoder is the
# feature-side equivalent (it works on 2-D X, column by column).
#
# Categories that were not present at fit time are mapped to -1 instead of
# raising (handle_unknown='use_encoded_value' needs scikit-learn >= 0.24).
#
# The step names are left unchanged so existing `named_steps[...]` lookups and
# `label_encoding__*` / `model__*` parameter names keep working.
pipeline = Pipeline([
    ('label_encoding', OrdinalEncoder(handle_unknown='use_encoded_value',
                                      unknown_value=-1)),
    ('model', DecisionTreeClassifier())
])


In [8]:
train = pd.DataFrame({'City': ['Delhi', 'Mumbai', 'Chennai', 'Delhi']})
test = pd.DataFrame({'City': ['Mumbai', 'Kolkata']})

# Fit on the training labels only; the test set must not influence the codes.
le = LabelEncoder()
train['City_Encoded'] = le.fit_transform(train['City'])

# Handle unseen categories safely.
# Build the label -> code table once from the fitted encoder, then map the
# whole column in a single vectorised pass. This avoids calling
# le.transform() (and scanning le.classes_) once per row.
city_to_code = dict(zip(le.classes_, le.transform(le.classes_)))

# Labels missing from the table come back as NaN from map(); they are replaced
# by the sentinel -1, and the column is cast back to integers.
test['City_Encoded'] = test['City'].map(city_to_code).fillna(-1).astype('int64')

print(train)
print(test)


      City  City_Encoded
0    Delhi             1
1   Mumbai             2
2  Chennai             0
3    Delhi             1
      City  City_Encoded
0   Mumbai             2
1  Kolkata            -1
