# Word Embeddings

In [11]:
import pandas as pd
import numpy as np
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.preprocessing import MinMaxScaler
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import f1_score
from sklearn.model_selection import GridSearchCV
from sklearn.naive_bayes import ComplementNB
from sklearn.svm import LinearSVC
from sklearn.ensemble import RandomForestClassifier
from sklearn.dummy import DummyClassifier
import gensim.downloader as api
from gensim.models import KeyedVectors
import gensim

In [2]:
test_df = pd.read_csv("../../data/prepared/test.csv")
train_df = pd.read_csv("../../data/prepared/train.csv")
valid_df = pd.read_csv("../../data/prepared/valid.csv")
unlabeled_df = pd.read_csv("../../data/prepared/unlabeled.csv")
bigger_train_df = pd.concat([train_df, valid_df], ignore_index=True)
results = {}

## Most Common and Stratified Baselines

In [3]:
baseline_classifier = DummyClassifier(strategy='most_frequent', random_state=42)
baseline_classifier.fit(train_df["problem_abstract"], train_df["team"])
y_pred = baseline_classifier.predict(test_df["problem_abstract"])
results["dummy most common"] = f1_score(test_df["team"], y_pred, average='micro')
print("F1-micro Score on Test Set:", results["dummy most common"])

baseline_classifier = DummyClassifier(strategy='stratified', random_state=42)
baseline_classifier.fit(train_df["problem_abstract"], train_df["team"])
y_pred = baseline_classifier.predict(test_df["problem_abstract"])
results["dummy stratified"] = f1_score(test_df["team"], y_pred, average='micro')
print("F1-micro Score on Test Set:", results["dummy stratified"])

F1-micro Score on Test Set: 0.3333333333333333
F1-micro Score on Test Set: 0.18984547461368653


## Log Regression

In [4]:


# Function to convert text into averaged word embeddings
def text_to_avg_vector(text, model):
    words = text.split()
    words_in_vocab = [word for word in words if word in model.key_to_index]
    if len(words_in_vocab) == 0:
        return np.zeros(model.vector_size)
    avg_vector = np.mean([model[word] for word in words_in_vocab], axis=0)
    return avg_vector

def transform_with_embeddings(df, model):
    return np.array(df['problem_abstract'].apply(lambda s: text_to_avg_vector("" if s is None or pd.isna(s) else s, model)).tolist())

word2vec_model = KeyedVectors.load_word2vec_format('../../models/GoogleNews-vectors-negative300.bin', binary=True)
glove_model = KeyedVectors.load_word2vec_format('../../models/glove.840B.300d.txt', binary=False, no_header=True)
# Transform train and test data
X_train_word2vec = transform_with_embeddings(train_df, word2vec_model)
X_train_glove = transform_with_embeddings(train_df, glove_model)
y_train = train_df['team']
X_test_word2vec = transform_with_embeddings(test_df, word2vec_model)
X_test_glove = transform_with_embeddings(test_df, glove_model)
y_test = test_df['team']

In [5]:
def finetune(X_train, y_train, model, param_grid, metric, cv=5, verbose=2):

    grid_search = GridSearchCV(model, param_grid, cv=5, scoring=metric, verbose=verbose)
    grid_search.fit(X_train, y_train)
    best_model = grid_search.best_estimator_
    best_params = grid_search.best_params_
    return best_model, best_params

def evaluate(X_test, y_test, model):

    y_pred = model.predict(X_test)
    metric = f1_score(y_test, y_pred, average="micro")
    return metric

In [6]:
model, model_params = finetune(
    X_train_word2vec, 
    y_train,
    LogisticRegression(random_state=42, penalty="elasticnet", class_weight="balanced", n_jobs=-1, solver="saga"),
    {
        "C": [0.01, 0.1, 1.0, 10.0],
        "l1_ratio": [0.0, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0]
    },
    "f1_micro",
    cv=5,
    verbose=2
    )
print("Best Hyperparameters:", model_params)
results["logistic regression word2vec"] = evaluate(X_test_word2vec, y_test, model)
print("F1-micro Score on Test Set:", results["logistic regression word2vec"])

Fitting 5 folds for each of 44 candidates, totalling 220 fits




[CV] END ...............................C=0.01, l1_ratio=0.0; total time=   5.5s
[CV] END ...............................C=0.01, l1_ratio=0.0; total time=   6.6s
[CV] END ...............................C=0.01, l1_ratio=0.0; total time=   4.8s
[CV] END ...............................C=0.01, l1_ratio=0.0; total time=   6.3s
[CV] END ...............................C=0.01, l1_ratio=0.0; total time=  11.0s
[CV] END ...............................C=0.01, l1_ratio=0.1; total time=   6.1s
[CV] END ...............................C=0.01, l1_ratio=0.1; total time=   4.8s
[CV] END ...............................C=0.01, l1_ratio=0.1; total time=   6.4s
[CV] END ...............................C=0.01, l1_ratio=0.1; total time=   9.1s
[CV] END ...............................C=0.01, l1_ratio=0.1; total time=   9.1s
[CV] END ...............................C=0.01, l1_ratio=0.2; total time=   2.7s
[CV] END ...............................C=0.01, l1_ratio=0.2; total time=   4.8s
[CV] END ...................



[CV] END ................................C=0.1, l1_ratio=0.0; total time=  30.0s




[CV] END ................................C=0.1, l1_ratio=0.0; total time=  32.9s




[CV] END ................................C=0.1, l1_ratio=0.0; total time=  35.3s




[CV] END ................................C=0.1, l1_ratio=0.0; total time=  34.6s




[CV] END ................................C=0.1, l1_ratio=0.0; total time=  33.3s




[CV] END ................................C=0.1, l1_ratio=0.1; total time= 1.2min




[CV] END ................................C=0.1, l1_ratio=0.1; total time= 1.3min




[CV] END ................................C=0.1, l1_ratio=0.1; total time= 1.3min




[CV] END ................................C=0.1, l1_ratio=0.1; total time= 1.3min




[CV] END ................................C=0.1, l1_ratio=0.1; total time= 1.3min




[CV] END ................................C=0.1, l1_ratio=0.2; total time=  53.0s




[CV] END ................................C=0.1, l1_ratio=0.2; total time=  54.8s




[CV] END ................................C=0.1, l1_ratio=0.2; total time=  53.6s




[CV] END ................................C=0.1, l1_ratio=0.2; total time=  59.8s




[CV] END ................................C=0.1, l1_ratio=0.2; total time= 1.0min




[CV] END ................................C=0.1, l1_ratio=0.3; total time=  47.1s




[CV] END ................................C=0.1, l1_ratio=0.3; total time=  52.5s




[CV] END ................................C=0.1, l1_ratio=0.3; total time=  54.4s




[CV] END ................................C=0.1, l1_ratio=0.3; total time=  46.2s




[CV] END ................................C=0.1, l1_ratio=0.3; total time=  42.0s




[CV] END ................................C=0.1, l1_ratio=0.4; total time=  38.3s




[CV] END ................................C=0.1, l1_ratio=0.4; total time=  41.3s




[CV] END ................................C=0.1, l1_ratio=0.4; total time=  42.3s




[CV] END ................................C=0.1, l1_ratio=0.4; total time=  37.1s




[CV] END ................................C=0.1, l1_ratio=0.4; total time=  36.0s




[CV] END ................................C=0.1, l1_ratio=0.5; total time=  38.8s
[CV] END ................................C=0.1, l1_ratio=0.5; total time=  13.0s
[CV] END ................................C=0.1, l1_ratio=0.5; total time=  14.1s




[CV] END ................................C=0.1, l1_ratio=0.5; total time=  39.5s




[CV] END ................................C=0.1, l1_ratio=0.5; total time=  39.5s
[CV] END ................................C=0.1, l1_ratio=0.6; total time=  13.3s
[CV] END ................................C=0.1, l1_ratio=0.6; total time=  15.2s
[CV] END ................................C=0.1, l1_ratio=0.6; total time=  14.0s
[CV] END ................................C=0.1, l1_ratio=0.6; total time=  23.2s




[CV] END ................................C=0.1, l1_ratio=0.6; total time=  31.8s
[CV] END ................................C=0.1, l1_ratio=0.7; total time=  13.6s
[CV] END ................................C=0.1, l1_ratio=0.7; total time=  17.7s
[CV] END ................................C=0.1, l1_ratio=0.7; total time=  13.1s
[CV] END ................................C=0.1, l1_ratio=0.7; total time=  17.6s




[CV] END ................................C=0.1, l1_ratio=0.7; total time=  26.7s
[CV] END ................................C=0.1, l1_ratio=0.8; total time=  20.8s
[CV] END ................................C=0.1, l1_ratio=0.8; total time=  21.2s
[CV] END ................................C=0.1, l1_ratio=0.8; total time=  20.0s
[CV] END ................................C=0.1, l1_ratio=0.8; total time=  21.5s




[CV] END ................................C=0.1, l1_ratio=0.8; total time=  37.7s
[CV] END ................................C=0.1, l1_ratio=0.9; total time=  29.5s
[CV] END ................................C=0.1, l1_ratio=0.9; total time=  21.7s
[CV] END ................................C=0.1, l1_ratio=0.9; total time=  22.5s
[CV] END ................................C=0.1, l1_ratio=0.9; total time=  33.3s




[CV] END ................................C=0.1, l1_ratio=0.9; total time=  39.3s




[CV] END ................................C=0.1, l1_ratio=1.0; total time=  40.6s




[CV] END ................................C=0.1, l1_ratio=1.0; total time=  42.8s




[CV] END ................................C=0.1, l1_ratio=1.0; total time=  38.6s




[CV] END ................................C=0.1, l1_ratio=1.0; total time=  34.2s




[CV] END ................................C=0.1, l1_ratio=1.0; total time=  37.2s




[CV] END ................................C=1.0, l1_ratio=0.0; total time=  28.7s




[CV] END ................................C=1.0, l1_ratio=0.0; total time=  26.8s




[CV] END ................................C=1.0, l1_ratio=0.0; total time=  29.6s




[CV] END ................................C=1.0, l1_ratio=0.0; total time=  28.7s




[CV] END ................................C=1.0, l1_ratio=0.0; total time=  26.1s




[CV] END ................................C=1.0, l1_ratio=0.1; total time= 1.1min




[CV] END ................................C=1.0, l1_ratio=0.1; total time= 1.2min




[CV] END ................................C=1.0, l1_ratio=0.1; total time= 1.3min




[CV] END ................................C=1.0, l1_ratio=0.1; total time= 1.2min




[CV] END ................................C=1.0, l1_ratio=0.1; total time= 1.2min




[CV] END ................................C=1.0, l1_ratio=0.2; total time= 1.2min




[CV] END ................................C=1.0, l1_ratio=0.2; total time= 1.2min




[CV] END ................................C=1.0, l1_ratio=0.2; total time= 1.3min




[CV] END ................................C=1.0, l1_ratio=0.2; total time= 1.3min




[CV] END ................................C=1.0, l1_ratio=0.2; total time= 1.3min




[CV] END ................................C=1.0, l1_ratio=0.3; total time= 1.3min




[CV] END ................................C=1.0, l1_ratio=0.3; total time= 1.3min




[CV] END ................................C=1.0, l1_ratio=0.3; total time= 1.4min




[CV] END ................................C=1.0, l1_ratio=0.3; total time= 1.3min




[CV] END ................................C=1.0, l1_ratio=0.3; total time= 1.3min




[CV] END ................................C=1.0, l1_ratio=0.4; total time= 1.1min




[CV] END ................................C=1.0, l1_ratio=0.4; total time= 1.2min




[CV] END ................................C=1.0, l1_ratio=0.4; total time= 1.3min




[CV] END ................................C=1.0, l1_ratio=0.4; total time= 1.2min




[CV] END ................................C=1.0, l1_ratio=0.4; total time= 1.2min




[CV] END ................................C=1.0, l1_ratio=0.5; total time= 1.1min




[CV] END ................................C=1.0, l1_ratio=0.5; total time= 1.1min




[CV] END ................................C=1.0, l1_ratio=0.5; total time= 1.2min




[CV] END ................................C=1.0, l1_ratio=0.5; total time= 1.1min




[CV] END ................................C=1.0, l1_ratio=0.5; total time= 1.1min




[CV] END ................................C=1.0, l1_ratio=0.6; total time=  56.0s




[CV] END ................................C=1.0, l1_ratio=0.6; total time=  57.8s




[CV] END ................................C=1.0, l1_ratio=0.6; total time=  59.5s




[CV] END ................................C=1.0, l1_ratio=0.6; total time=  55.8s




[CV] END ................................C=1.0, l1_ratio=0.6; total time=  55.1s




[CV] END ................................C=1.0, l1_ratio=0.7; total time=  45.9s




[CV] END ................................C=1.0, l1_ratio=0.7; total time=  47.2s




[CV] END ................................C=1.0, l1_ratio=0.7; total time=  53.7s




[CV] END ................................C=1.0, l1_ratio=0.7; total time=  47.0s




[CV] END ................................C=1.0, l1_ratio=0.7; total time=  47.9s




[CV] END ................................C=1.0, l1_ratio=0.8; total time=  42.6s




[CV] END ................................C=1.0, l1_ratio=0.8; total time=  44.1s




[CV] END ................................C=1.0, l1_ratio=0.8; total time=  48.6s




[CV] END ................................C=1.0, l1_ratio=0.8; total time=  42.0s




[CV] END ................................C=1.0, l1_ratio=0.8; total time=  40.3s




[CV] END ................................C=1.0, l1_ratio=0.9; total time=  37.0s




[CV] END ................................C=1.0, l1_ratio=0.9; total time=  36.9s




[CV] END ................................C=1.0, l1_ratio=0.9; total time=  41.0s




[CV] END ................................C=1.0, l1_ratio=0.9; total time=  40.2s




[CV] END ................................C=1.0, l1_ratio=0.9; total time=  37.7s




[CV] END ................................C=1.0, l1_ratio=1.0; total time=  32.1s




[CV] END ................................C=1.0, l1_ratio=1.0; total time=  33.6s




[CV] END ................................C=1.0, l1_ratio=1.0; total time=  38.2s




[CV] END ................................C=1.0, l1_ratio=1.0; total time=  36.3s




[CV] END ................................C=1.0, l1_ratio=1.0; total time=  37.7s




[CV] END ...............................C=10.0, l1_ratio=0.0; total time=  19.1s




[CV] END ...............................C=10.0, l1_ratio=0.0; total time=  18.1s




[CV] END ...............................C=10.0, l1_ratio=0.0; total time=  20.3s




[CV] END ...............................C=10.0, l1_ratio=0.0; total time=  20.1s




[CV] END ...............................C=10.0, l1_ratio=0.0; total time=  19.4s




[CV] END ...............................C=10.0, l1_ratio=0.1; total time=  49.4s




[CV] END ...............................C=10.0, l1_ratio=0.1; total time=  48.0s




[CV] END ...............................C=10.0, l1_ratio=0.1; total time=  51.2s




[CV] END ...............................C=10.0, l1_ratio=0.1; total time=  50.7s




[CV] END ...............................C=10.0, l1_ratio=0.1; total time=  49.2s




[CV] END ...............................C=10.0, l1_ratio=0.2; total time=  46.1s




[CV] END ...............................C=10.0, l1_ratio=0.2; total time=  47.3s




[CV] END ...............................C=10.0, l1_ratio=0.2; total time=  50.3s




[CV] END ...............................C=10.0, l1_ratio=0.2; total time=  50.6s




[CV] END ...............................C=10.0, l1_ratio=0.2; total time=  50.2s




[CV] END ...............................C=10.0, l1_ratio=0.3; total time=  47.8s




[CV] END ...............................C=10.0, l1_ratio=0.3; total time=  47.2s




[CV] END ...............................C=10.0, l1_ratio=0.3; total time=  52.9s




[CV] END ...............................C=10.0, l1_ratio=0.3; total time=  52.1s




[CV] END ...............................C=10.0, l1_ratio=0.3; total time=  51.1s




[CV] END ...............................C=10.0, l1_ratio=0.4; total time=  51.4s




[CV] END ...............................C=10.0, l1_ratio=0.4; total time=  51.3s




[CV] END ...............................C=10.0, l1_ratio=0.4; total time=  56.5s




[CV] END ...............................C=10.0, l1_ratio=0.4; total time= 1.0min




[CV] END ...............................C=10.0, l1_ratio=0.4; total time=  56.1s




[CV] END ...............................C=10.0, l1_ratio=0.5; total time=  54.9s




[CV] END ...............................C=10.0, l1_ratio=0.5; total time=  53.4s




[CV] END ...............................C=10.0, l1_ratio=0.5; total time=  57.8s




[CV] END ...............................C=10.0, l1_ratio=0.5; total time=  58.8s




[CV] END ...............................C=10.0, l1_ratio=0.5; total time=  54.9s




[CV] END ...............................C=10.0, l1_ratio=0.6; total time=  50.3s




[CV] END ...............................C=10.0, l1_ratio=0.6; total time=  50.1s




[CV] END ...............................C=10.0, l1_ratio=0.6; total time=  56.4s




[CV] END ...............................C=10.0, l1_ratio=0.6; total time=  59.0s




[CV] END ...............................C=10.0, l1_ratio=0.6; total time=  55.0s




[CV] END ...............................C=10.0, l1_ratio=0.7; total time=  49.6s




[CV] END ...............................C=10.0, l1_ratio=0.7; total time=  51.0s




[CV] END ...............................C=10.0, l1_ratio=0.7; total time=  55.6s




[CV] END ...............................C=10.0, l1_ratio=0.7; total time=  58.1s




[CV] END ...............................C=10.0, l1_ratio=0.7; total time=  54.1s




[CV] END ...............................C=10.0, l1_ratio=0.8; total time=  50.0s




[CV] END ...............................C=10.0, l1_ratio=0.8; total time=  50.2s




[CV] END ...............................C=10.0, l1_ratio=0.8; total time=  52.9s




[CV] END ...............................C=10.0, l1_ratio=0.8; total time=  54.3s




[CV] END ...............................C=10.0, l1_ratio=0.8; total time=  51.0s




[CV] END ...............................C=10.0, l1_ratio=0.9; total time=  46.7s




[CV] END ...............................C=10.0, l1_ratio=0.9; total time=  47.1s




[CV] END ...............................C=10.0, l1_ratio=0.9; total time=  51.5s




[CV] END ...............................C=10.0, l1_ratio=0.9; total time=  50.9s




[CV] END ...............................C=10.0, l1_ratio=0.9; total time=  49.7s




[CV] END ...............................C=10.0, l1_ratio=1.0; total time=  44.0s




[CV] END ...............................C=10.0, l1_ratio=1.0; total time=  44.0s




[CV] END ...............................C=10.0, l1_ratio=1.0; total time=  48.9s




[CV] END ...............................C=10.0, l1_ratio=1.0; total time=  48.1s




[CV] END ...............................C=10.0, l1_ratio=1.0; total time=  46.7s
Best Hyperparameters: {'C': 10.0, 'l1_ratio': 0.5}
F1-micro Score on Test Set: 0.5342163355408388




In [7]:
model, model_params = finetune(
    X_train_glove, 
    y_train,
    LogisticRegression(random_state=42, penalty="elasticnet", class_weight="balanced", n_jobs=-1, solver="saga"),
    {
        "C": [0.01, 0.1, 1.0, 10.0],
        "l1_ratio": [0.0, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0]
    },
    "f1_micro",
    cv=5,
    verbose=2
    )
print("Best Hyperparameters:", model_params)
results["logistic regression glove"] = evaluate(X_test_glove, y_test, model)
print("F1-micro Score on Test Set:", results["logistic regression glove"])



Fitting 5 folds for each of 44 candidates, totalling 220 fits




[CV] END ...............................C=0.01, l1_ratio=0.0; total time=  17.1s




[CV] END ...............................C=0.01, l1_ratio=0.0; total time=  17.6s




[CV] END ...............................C=0.01, l1_ratio=0.0; total time=  18.0s




[CV] END ...............................C=0.01, l1_ratio=0.0; total time=  17.8s




[CV] END ...............................C=0.01, l1_ratio=0.0; total time=  18.3s
[CV] END ...............................C=0.01, l1_ratio=0.1; total time=   7.8s
[CV] END ...............................C=0.01, l1_ratio=0.1; total time=   6.4s
[CV] END ...............................C=0.01, l1_ratio=0.1; total time=   6.3s
[CV] END ...............................C=0.01, l1_ratio=0.1; total time=   6.6s




[CV] END ...............................C=0.01, l1_ratio=0.1; total time=  22.4s
[CV] END ...............................C=0.01, l1_ratio=0.2; total time=   3.8s
[CV] END ...............................C=0.01, l1_ratio=0.2; total time=   5.4s
[CV] END ...............................C=0.01, l1_ratio=0.2; total time=   4.4s
[CV] END ...............................C=0.01, l1_ratio=0.2; total time=   6.1s




[CV] END ...............................C=0.01, l1_ratio=0.2; total time=  20.6s
[CV] END ...............................C=0.01, l1_ratio=0.3; total time=   3.7s
[CV] END ...............................C=0.01, l1_ratio=0.3; total time=   3.6s
[CV] END ...............................C=0.01, l1_ratio=0.3; total time=   3.6s
[CV] END ...............................C=0.01, l1_ratio=0.3; total time=   5.5s
[CV] END ...............................C=0.01, l1_ratio=0.3; total time=   6.0s
[CV] END ...............................C=0.01, l1_ratio=0.4; total time=   3.8s
[CV] END ...............................C=0.01, l1_ratio=0.4; total time=   3.7s
[CV] END ...............................C=0.01, l1_ratio=0.4; total time=   4.5s
[CV] END ...............................C=0.01, l1_ratio=0.4; total time=   5.3s
[CV] END ...............................C=0.01, l1_ratio=0.4; total time=   4.7s
[CV] END ...............................C=0.01, l1_ratio=0.5; total time=   3.5s
[CV] END ...................



[CV] END ................................C=0.1, l1_ratio=0.0; total time=  16.4s




[CV] END ................................C=0.1, l1_ratio=0.0; total time=  17.3s




[CV] END ................................C=0.1, l1_ratio=0.0; total time=  17.1s




[CV] END ................................C=0.1, l1_ratio=0.0; total time=  17.5s




[CV] END ................................C=0.1, l1_ratio=0.0; total time=  17.7s




[CV] END ................................C=0.1, l1_ratio=0.1; total time=  52.8s




[CV] END ................................C=0.1, l1_ratio=0.1; total time=  52.1s




[CV] END ................................C=0.1, l1_ratio=0.1; total time=  56.7s




[CV] END ................................C=0.1, l1_ratio=0.1; total time=  56.1s




[CV] END ................................C=0.1, l1_ratio=0.1; total time=  55.5s




[CV] END ................................C=0.1, l1_ratio=0.2; total time=  39.9s




[CV] END ................................C=0.1, l1_ratio=0.2; total time=  40.3s




[CV] END ................................C=0.1, l1_ratio=0.2; total time=  42.7s




[CV] END ................................C=0.1, l1_ratio=0.2; total time=  41.6s




[CV] END ................................C=0.1, l1_ratio=0.2; total time=  41.2s




[CV] END ................................C=0.1, l1_ratio=0.3; total time=  30.1s




[CV] END ................................C=0.1, l1_ratio=0.3; total time=  31.5s




[CV] END ................................C=0.1, l1_ratio=0.3; total time=  32.6s




[CV] END ................................C=0.1, l1_ratio=0.3; total time=  31.2s




[CV] END ................................C=0.1, l1_ratio=0.3; total time=  33.3s




[CV] END ................................C=0.1, l1_ratio=0.4; total time=  27.0s




[CV] END ................................C=0.1, l1_ratio=0.4; total time=  27.6s




[CV] END ................................C=0.1, l1_ratio=0.4; total time=  28.9s




[CV] END ................................C=0.1, l1_ratio=0.4; total time=  27.1s




[CV] END ................................C=0.1, l1_ratio=0.4; total time=  27.2s




[CV] END ................................C=0.1, l1_ratio=0.5; total time=  25.4s




[CV] END ................................C=0.1, l1_ratio=0.5; total time=  26.4s




[CV] END ................................C=0.1, l1_ratio=0.5; total time=  25.9s




[CV] END ................................C=0.1, l1_ratio=0.5; total time=  26.0s




[CV] END ................................C=0.1, l1_ratio=0.5; total time=  25.0s




[CV] END ................................C=0.1, l1_ratio=0.6; total time=  23.3s




[CV] END ................................C=0.1, l1_ratio=0.6; total time=  24.8s




[CV] END ................................C=0.1, l1_ratio=0.6; total time=  24.2s




[CV] END ................................C=0.1, l1_ratio=0.6; total time=  23.5s




[CV] END ................................C=0.1, l1_ratio=0.6; total time=  23.0s




[CV] END ................................C=0.1, l1_ratio=0.7; total time=  21.5s




[CV] END ................................C=0.1, l1_ratio=0.7; total time=  22.3s




[CV] END ................................C=0.1, l1_ratio=0.7; total time=  22.8s




[CV] END ................................C=0.1, l1_ratio=0.7; total time=  23.1s




[CV] END ................................C=0.1, l1_ratio=0.7; total time=  22.3s




[CV] END ................................C=0.1, l1_ratio=0.8; total time=  21.1s




[CV] END ................................C=0.1, l1_ratio=0.8; total time=  21.9s




[CV] END ................................C=0.1, l1_ratio=0.8; total time=  22.4s




[CV] END ................................C=0.1, l1_ratio=0.8; total time=  22.5s




[CV] END ................................C=0.1, l1_ratio=0.8; total time=  21.8s




[CV] END ................................C=0.1, l1_ratio=0.9; total time=  20.7s




[CV] END ................................C=0.1, l1_ratio=0.9; total time=  21.2s




[CV] END ................................C=0.1, l1_ratio=0.9; total time=  22.0s




[CV] END ................................C=0.1, l1_ratio=0.9; total time=  22.3s




[CV] END ................................C=0.1, l1_ratio=0.9; total time=  21.5s




[CV] END ................................C=0.1, l1_ratio=1.0; total time=  20.5s




[CV] END ................................C=0.1, l1_ratio=1.0; total time=  20.9s




[CV] END ................................C=0.1, l1_ratio=1.0; total time=  22.1s




[CV] END ................................C=0.1, l1_ratio=1.0; total time=  22.0s




[CV] END ................................C=0.1, l1_ratio=1.0; total time=  21.2s




[CV] END ................................C=1.0, l1_ratio=0.0; total time=  14.8s




[CV] END ................................C=1.0, l1_ratio=0.0; total time=  15.1s




[CV] END ................................C=1.0, l1_ratio=0.0; total time=  16.1s




[CV] END ................................C=1.0, l1_ratio=0.0; total time=  16.1s




[CV] END ................................C=1.0, l1_ratio=0.0; total time=  15.4s




[CV] END ................................C=1.0, l1_ratio=0.1; total time=  41.0s




[CV] END ................................C=1.0, l1_ratio=0.1; total time=  42.2s




[CV] END ................................C=1.0, l1_ratio=0.1; total time=  46.6s




[CV] END ................................C=1.0, l1_ratio=0.1; total time=  46.5s




[CV] END ................................C=1.0, l1_ratio=0.1; total time=  44.3s




[CV] END ................................C=1.0, l1_ratio=0.2; total time=  46.4s




[CV] END ................................C=1.0, l1_ratio=0.2; total time=  47.4s




[CV] END ................................C=1.0, l1_ratio=0.2; total time=  52.9s




[CV] END ................................C=1.0, l1_ratio=0.2; total time=  52.6s




[CV] END ................................C=1.0, l1_ratio=0.2; total time=  50.1s




[CV] END ................................C=1.0, l1_ratio=0.3; total time=  48.1s




[CV] END ................................C=1.0, l1_ratio=0.3; total time=  48.8s




[CV] END ................................C=1.0, l1_ratio=0.3; total time=  54.3s




[CV] END ................................C=1.0, l1_ratio=0.3; total time=  53.9s




[CV] END ................................C=1.0, l1_ratio=0.3; total time=  50.7s




[CV] END ................................C=1.0, l1_ratio=0.4; total time=  46.1s




[CV] END ................................C=1.0, l1_ratio=0.4; total time=  46.4s




[CV] END ................................C=1.0, l1_ratio=0.4; total time=  52.9s




[CV] END ................................C=1.0, l1_ratio=0.4; total time=  51.7s




[CV] END ................................C=1.0, l1_ratio=0.4; total time=  47.9s




[CV] END ................................C=1.0, l1_ratio=0.5; total time=  42.6s




[CV] END ................................C=1.0, l1_ratio=0.5; total time=  43.8s




[CV] END ................................C=1.0, l1_ratio=0.5; total time=  49.5s




[CV] END ................................C=1.0, l1_ratio=0.5; total time=  48.1s




[CV] END ................................C=1.0, l1_ratio=0.5; total time=  44.3s




[CV] END ................................C=1.0, l1_ratio=0.6; total time=  38.9s




[CV] END ................................C=1.0, l1_ratio=0.6; total time=  40.0s




[CV] END ................................C=1.0, l1_ratio=0.6; total time=  46.2s




[CV] END ................................C=1.0, l1_ratio=0.6; total time=  42.5s




[CV] END ................................C=1.0, l1_ratio=0.6; total time=  35.2s




[CV] END ................................C=1.0, l1_ratio=0.7; total time=  31.4s




[CV] END ................................C=1.0, l1_ratio=0.7; total time=  32.7s




[CV] END ................................C=1.0, l1_ratio=0.7; total time=  37.7s




[CV] END ................................C=1.0, l1_ratio=0.7; total time=  35.9s




[CV] END ................................C=1.0, l1_ratio=0.7; total time=  32.5s




[CV] END ................................C=1.0, l1_ratio=0.8; total time=  29.5s




[CV] END ................................C=1.0, l1_ratio=0.8; total time=  30.7s




[CV] END ................................C=1.0, l1_ratio=0.8; total time=  34.3s




[CV] END ................................C=1.0, l1_ratio=0.8; total time=  32.6s




[CV] END ................................C=1.0, l1_ratio=0.8; total time=  30.1s




[CV] END ................................C=1.0, l1_ratio=0.9; total time=  27.5s




[CV] END ................................C=1.0, l1_ratio=0.9; total time=  28.5s




[CV] END ................................C=1.0, l1_ratio=0.9; total time=  32.4s




[CV] END ................................C=1.0, l1_ratio=0.9; total time=  30.9s




[CV] END ................................C=1.0, l1_ratio=0.9; total time=  28.6s




[CV] END ................................C=1.0, l1_ratio=1.0; total time=  26.9s




[CV] END ................................C=1.0, l1_ratio=1.0; total time=  27.3s




[CV] END ................................C=1.0, l1_ratio=1.0; total time=  30.6s




[CV] END ................................C=1.0, l1_ratio=1.0; total time=  29.3s




[CV] END ................................C=1.0, l1_ratio=1.0; total time=  27.2s




[CV] END ...............................C=10.0, l1_ratio=0.0; total time=  12.4s




[CV] END ...............................C=10.0, l1_ratio=0.0; total time=  12.7s




[CV] END ...............................C=10.0, l1_ratio=0.0; total time=  13.6s




[CV] END ...............................C=10.0, l1_ratio=0.0; total time=  13.5s




[CV] END ...............................C=10.0, l1_ratio=0.0; total time=  13.0s




[CV] END ...............................C=10.0, l1_ratio=0.1; total time=  33.4s




[CV] END ...............................C=10.0, l1_ratio=0.1; total time=  34.5s




[CV] END ...............................C=10.0, l1_ratio=0.1; total time=  37.2s




[CV] END ...............................C=10.0, l1_ratio=0.1; total time=  37.6s




[CV] END ...............................C=10.0, l1_ratio=0.1; total time=  35.8s




[CV] END ...............................C=10.0, l1_ratio=0.2; total time=  34.6s




[CV] END ...............................C=10.0, l1_ratio=0.2; total time=  35.3s




[CV] END ...............................C=10.0, l1_ratio=0.2; total time=  39.8s




[CV] END ...............................C=10.0, l1_ratio=0.2; total time=  39.4s




[CV] END ...............................C=10.0, l1_ratio=0.2; total time=  37.9s




[CV] END ...............................C=10.0, l1_ratio=0.3; total time=  36.2s




[CV] END ...............................C=10.0, l1_ratio=0.3; total time=  37.4s




[CV] END ...............................C=10.0, l1_ratio=0.3; total time=  42.2s




[CV] END ...............................C=10.0, l1_ratio=0.3; total time=  41.6s




[CV] END ...............................C=10.0, l1_ratio=0.3; total time=  40.0s




[CV] END ...............................C=10.0, l1_ratio=0.4; total time=  37.7s




[CV] END ...............................C=10.0, l1_ratio=0.4; total time=  38.5s




[CV] END ...............................C=10.0, l1_ratio=0.4; total time=  43.2s




[CV] END ...............................C=10.0, l1_ratio=0.4; total time=  42.7s




[CV] END ...............................C=10.0, l1_ratio=0.4; total time=  41.1s




[CV] END ...............................C=10.0, l1_ratio=0.5; total time=  38.1s




[CV] END ...............................C=10.0, l1_ratio=0.5; total time=  39.1s




[CV] END ...............................C=10.0, l1_ratio=0.5; total time=  43.3s




[CV] END ...............................C=10.0, l1_ratio=0.5; total time=  43.2s




[CV] END ...............................C=10.0, l1_ratio=0.5; total time=  41.3s




[CV] END ...............................C=10.0, l1_ratio=0.6; total time=  38.2s




[CV] END ...............................C=10.0, l1_ratio=0.6; total time=  39.4s




[CV] END ...............................C=10.0, l1_ratio=0.6; total time=  43.0s




[CV] END ...............................C=10.0, l1_ratio=0.6; total time=  43.2s




[CV] END ...............................C=10.0, l1_ratio=0.6; total time=  41.2s




[CV] END ...............................C=10.0, l1_ratio=0.7; total time=  38.2s




[CV] END ...............................C=10.0, l1_ratio=0.7; total time=  39.0s




[CV] END ...............................C=10.0, l1_ratio=0.7; total time=  42.5s




[CV] END ...............................C=10.0, l1_ratio=0.7; total time=  42.8s




[CV] END ...............................C=10.0, l1_ratio=0.7; total time=  41.0s




[CV] END ...............................C=10.0, l1_ratio=0.8; total time=  37.5s




[CV] END ...............................C=10.0, l1_ratio=0.8; total time=  38.1s




[CV] END ...............................C=10.0, l1_ratio=0.8; total time=  41.3s




[CV] END ...............................C=10.0, l1_ratio=0.8; total time=  42.2s




[CV] END ...............................C=10.0, l1_ratio=0.8; total time=  40.4s




[CV] END ...............................C=10.0, l1_ratio=0.9; total time=  36.8s




[CV] END ...............................C=10.0, l1_ratio=0.9; total time=  37.1s




[CV] END ...............................C=10.0, l1_ratio=0.9; total time=  40.1s




[CV] END ...............................C=10.0, l1_ratio=0.9; total time=  41.2s




[CV] END ...............................C=10.0, l1_ratio=0.9; total time=  39.5s




[CV] END ...............................C=10.0, l1_ratio=1.0; total time=  35.8s




[CV] END ...............................C=10.0, l1_ratio=1.0; total time=  36.2s




[CV] END ...............................C=10.0, l1_ratio=1.0; total time=  38.8s




[CV] END ...............................C=10.0, l1_ratio=1.0; total time=  40.1s




[CV] END ...............................C=10.0, l1_ratio=1.0; total time=  38.6s
Best Hyperparameters: {'C': 10.0, 'l1_ratio': 0.0}
F1-micro Score on Test Set: 0.565121412803532




## Naive Bayes

In [13]:
scaler_word2vec = MinMaxScaler()
scaler_word2vec.fit(X_train_word2vec)
model, model_params = finetune(
    X_train_word2vec, 
    y_train,
    ComplementNB(),
    {
        "norm": [True, False],
        "alpha": [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0],
        
    },
    "f1_micro",
    cv=5,
    verbose=2,
    )
print("Best Hyperparameters:", model_params)
results["naive bayes word2vec"] = evaluate(X_test_word2vec, y_test, model)
print("F1-micro Score on Test Set:", results["naive bayes word2vec"])

Fitting 5 folds for each of 20 candidates, totalling 100 fits
[CV] END ...............................alpha=0.1, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.1, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.1, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.1, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.1, norm=True; total time=   0.0s
[CV] END ..............................alpha=0.1, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.1, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.1, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.1, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.1, norm=False; total time=   0.0s
[CV] END ...............................alpha=0.2, norm=True; total time=   0.0s
[CV] END ...............................alpha=0



[CV] END ..............................alpha=0.3, norm=False; total time=   0.0s
[CV] END ...............................alpha=0.4, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.4, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.4, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.4, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.4, norm=True; total time=   0.0s
[CV] END ..............................alpha=0.4, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.4, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.4, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.4, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.4, norm=False; total time=   0.0s
[CV] END ...............................alpha=0.5, norm=True; total time=   0.0s
[CV] END ...................

ValueError: 
All the 100 fits failed.
It is very likely that your model is misconfigured.
You can try to debug the error by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
100 fits failed with the following error:
Traceback (most recent call last):
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/model_selection/_validation.py", line 732, in _fit_and_score
    estimator.fit(X_train, y_train, **fit_params)
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/base.py", line 1151, in wrapper
    return fit_method(estimator, *args, **kwargs)
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/naive_bayes.py", line 772, in fit
    self._count(X, Y)
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/naive_bayes.py", line 1040, in _count
    check_non_negative(X, "ComplementNB (input X)")
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/utils/validation.py", line 1490, in check_non_negative
    raise ValueError("Negative values in data passed to %s" % whom)
ValueError: Negative values in data passed to ComplementNB (input X)


In [14]:
scaler_glove = MinMaxScaler()
scaler_glove.fit(X_train_glove)
model, model_params = finetune(
    scaler_glove.transform(X_train_glove), 
    y_train,
    ComplementNB(),
    {
        "norm": [True, False],
        "alpha": [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0],
        
    },
    "f1_micro",
    cv=5,
    verbose=2,
    )
print("Best Hyperparameters:", model_params)
results["naive bayes glove"] = evaluate(scaler_glove.transform(X_test_glove), y_test, model)
print("F1-micro Score on Test Set:", results["naive bayes glove"])

Fitting 5 folds for each of 20 candidates, totalling 100 fits
[CV] END ...............................alpha=0.1, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.1, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.1, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.1, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.1, norm=True; total time=   0.0s
[CV] END ..............................alpha=0.1, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.1, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.1, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.1, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.1, norm=False; total time=   0.0s
[CV] END ...............................alpha=0.2, norm=True; total time=   0.0s
[CV] END ...............................alpha=0



[CV] END ...............................alpha=0.2, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.2, norm=True; total time=   0.0s
[CV] END ..............................alpha=0.2, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.2, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.2, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.2, norm=False; total time=   0.0s
[CV] END ..............................alpha=0.2, norm=False; total time=   0.0s
[CV] END ...............................alpha=0.3, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.3, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.3, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.3, norm=True; total time=   0.0s
[CV] END ...............................alpha=0.3, norm=True; total time=   0.0s
[CV] END ...................

## Linear SVM

In [15]:
model, model_params = finetune(
    X_train_word2vec, 
    y_train,
    LinearSVC(loss="squared_hinge", class_weight="balanced", random_state=42),
    {
        "penalty": ["l1", "l2"],
        "C": [0.001, 0.01, 0.1, 1.0, 10.0, 100],
        "intercept_scaling": [0.001, 0.01, 0.1, 1.0, 10.0, 100]
    },
    "f1_micro",
    cv=5,
    verbose=2,
    )
print("Best Hyperparameters:", model_params)
results["linear svm word2vec"] = evaluate(X_test_word2vec, y_test, model)
print("F1-micro Score on Test Set:", results["linear svm word2vec"])

Fitting 5 folds for each of 72 candidates, totalling 360 fits
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l1; total time=   0.0s




[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l2; total time=   0.6s




[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l2; total time=   0.6s




[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l2; total time=   0.7s




[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l2; total time=   0.7s




[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l2; total time=   0.6s
[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l2; total time=   0.6s




[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l2; total time=   0.6s




[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l2; total time=   0.6s




[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l2; total time=   0.7s




[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l2; total time=   0.6s
[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l2; total time=   0.6s




[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l2; total time=   0.6s




[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l2; total time=   0.7s




[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l2; total time=   0.6s




[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l2; total time=   0.6s
[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l2; total time=   0.5s
[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l2; total time=   1.6s




[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l2; total time=   1.7s




[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l2; total time=   1.9s




[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l2; total time=   1.8s




[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l2; total time=   1.8s
[CV] END .........C=0.001, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END .........C=0.001, intercept_scaling=100, penalty=l2; total time=  34.8s




[CV] END .........C=0.001, intercept_scaling=100, penalty=l2; total time=  35.4s




[CV] END .........C=0.001, intercept_scaling=100, penalty=l2; total time=  37.2s




[CV] END .........C=0.001, intercept_scaling=100, penalty=l2; total time=  37.2s




[CV] END .........C=0.001, intercept_scaling=100, penalty=l2; total time=  36.3s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l2; total time=   0.5s




[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l2; total time=   0.5s




[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l2; total time=   0.5s




[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l2; total time=   0.5s




[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l2; total time=   0.5s
[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l2; total time=   0.5s




[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l2; total time=   0.5s




[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l2; total time=   0.5s




[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l2; total time=   0.5s




[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l2; total time=   0.5s
[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l2; total time=   0.5s




[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l2; total time=   0.5s




[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l2; total time=   0.5s




[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l2; total time=   0.5s




[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l2; total time=   0.5s
[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l2; total time=   0.5s




[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l2; total time=   0.6s




[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l2; total time=   0.6s




[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l2; total time=   0.6s




[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l2; total time=   0.6s
[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l2; total time=   5.6s




[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l2; total time=   6.0s




[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l2; total time=   6.6s




[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l2; total time=   6.5s




[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l2; total time=   6.1s
[CV] END ..........C=0.01, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END ..........C=0.01, intercept_scaling=100, penalty=l2; total time=  40.1s




[CV] END ..........C=0.01, intercept_scaling=100, penalty=l2; total time=  40.8s




[CV] END ..........C=0.01, intercept_scaling=100, penalty=l2; total time=  42.8s




[CV] END ..........C=0.01, intercept_scaling=100, penalty=l2; total time=  42.4s




[CV] END ..........C=0.01, intercept_scaling=100, penalty=l2; total time=  42.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l2; total time=   0.5s




[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l2; total time=   0.6s




[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l2; total time=   0.6s




[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l2; total time=   0.6s




[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l2; total time=   0.6s
[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l2; total time=   0.5s




[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l2; total time=   0.6s




[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l2; total time=   0.6s




[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l2; total time=   0.6s




[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l2; total time=   0.6s
[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l2; total time=   0.5s




[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l2; total time=   0.6s




[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l2; total time=   0.6s




[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l2; total time=   0.6s




[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l2; total time=   0.5s
[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l2; total time=   0.6s




[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l2; total time=   0.7s




[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l2; total time=   0.7s




[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l2; total time=   0.7s




[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l2; total time=   0.6s
[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l2; total time=   8.7s




[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l2; total time=   8.6s




[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l2; total time=   8.8s




[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l2; total time=   8.8s




[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l2; total time=   8.7s
[CV] END ...........C=0.1, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END ...........C=0.1, intercept_scaling=100, penalty=l2; total time=  32.7s




[CV] END ...........C=0.1, intercept_scaling=100, penalty=l2; total time=  33.0s




[CV] END ...........C=0.1, intercept_scaling=100, penalty=l2; total time=  34.1s




[CV] END ...........C=0.1, intercept_scaling=100, penalty=l2; total time=  34.3s




[CV] END ...........C=0.1, intercept_scaling=100, penalty=l2; total time=  33.6s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l2; total time=   0.8s




[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l2; total time=   0.9s




[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l2; total time=   0.8s




[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l2; total time=   0.9s




[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l2; total time=   0.9s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l2; total time=   0.8s




[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l2; total time=   0.9s




[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l2; total time=   0.8s




[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l2; total time=   0.9s




[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l2; total time=   0.9s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l2; total time=   0.8s




[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l2; total time=   0.9s




[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l2; total time=   0.8s




[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l2; total time=   0.9s




[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l2; total time=   0.9s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l2; total time=   1.0s




[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l2; total time=   1.1s




[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l2; total time=   1.0s




[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l2; total time=   1.1s




[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l2; total time=   1.0s
[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l2; total time=   8.0s




[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l2; total time=   8.0s




[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l2; total time=   8.1s




[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l2; total time=   8.2s




[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l2; total time=   8.0s
[CV] END ...........C=1.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END ...........C=1.0, intercept_scaling=100, penalty=l2; total time=  28.6s




[CV] END ...........C=1.0, intercept_scaling=100, penalty=l2; total time=  29.0s




[CV] END ...........C=1.0, intercept_scaling=100, penalty=l2; total time=  29.7s




[CV] END ...........C=1.0, intercept_scaling=100, penalty=l2; total time=  29.6s




[CV] END ...........C=1.0, intercept_scaling=100, penalty=l2; total time=  28.5s
[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s




[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l2; total time=   2.2s




[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l2; total time=   2.9s




[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l2; total time=   2.3s




[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l2; total time=   2.9s




[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l2; total time=   2.7s
[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l2; total time=   2.4s




[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l2; total time=   2.8s




[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l2; total time=   2.3s




[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l2; total time=   2.8s




[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l2; total time=   2.6s
[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l2; total time=   2.4s




[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l2; total time=   2.8s




[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l2; total time=   2.3s




[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l2; total time=   2.8s




[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l2; total time=   2.7s
[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l2; total time=   2.8s




[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l2; total time=   3.1s




[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l2; total time=   2.7s




[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l2; total time=   3.1s




[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l2; total time=   3.0s
[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l2; total time=   7.7s




[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l2; total time=   7.7s




[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l2; total time=   7.8s




[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l2; total time=   7.8s




[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l2; total time=   7.8s
[CV] END ..........C=10.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END ..........C=10.0, intercept_scaling=100, penalty=l2; total time=  28.3s




[CV] END ..........C=10.0, intercept_scaling=100, penalty=l2; total time=  27.7s




[CV] END ..........C=10.0, intercept_scaling=100, penalty=l2; total time=  28.6s




[CV] END ..........C=10.0, intercept_scaling=100, penalty=l2; total time=  28.6s




[CV] END ..........C=10.0, intercept_scaling=100, penalty=l2; total time=  28.5s
[CV] END .........C=100, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=100, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=100, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=100, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=100, intercept_scaling=0.001, penalty=l1; total time=   0.0s




[CV] END .........C=100, intercept_scaling=0.001, penalty=l2; total time=   3.3s




[CV] END .........C=100, intercept_scaling=0.001, penalty=l2; total time=   3.3s




[CV] END .........C=100, intercept_scaling=0.001, penalty=l2; total time=   3.3s




[CV] END .........C=100, intercept_scaling=0.001, penalty=l2; total time=   3.4s




[CV] END .........C=100, intercept_scaling=0.001, penalty=l2; total time=   3.4s
[CV] END ..........C=100, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END ..........C=100, intercept_scaling=0.01, penalty=l2; total time=   3.2s




[CV] END ..........C=100, intercept_scaling=0.01, penalty=l2; total time=   3.3s




[CV] END ..........C=100, intercept_scaling=0.01, penalty=l2; total time=   3.4s




[CV] END ..........C=100, intercept_scaling=0.01, penalty=l2; total time=   3.4s




[CV] END ..........C=100, intercept_scaling=0.01, penalty=l2; total time=   3.4s
[CV] END ...........C=100, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END ...........C=100, intercept_scaling=0.1, penalty=l2; total time=   3.2s




[CV] END ...........C=100, intercept_scaling=0.1, penalty=l2; total time=   3.2s




[CV] END ...........C=100, intercept_scaling=0.1, penalty=l2; total time=   3.3s




[CV] END ...........C=100, intercept_scaling=0.1, penalty=l2; total time=   3.2s




[CV] END ...........C=100, intercept_scaling=0.1, penalty=l2; total time=   3.2s
[CV] END ...........C=100, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END ...........C=100, intercept_scaling=1.0, penalty=l2; total time=   3.4s




[CV] END ...........C=100, intercept_scaling=1.0, penalty=l2; total time=   3.4s




[CV] END ...........C=100, intercept_scaling=1.0, penalty=l2; total time=   3.4s




[CV] END ...........C=100, intercept_scaling=1.0, penalty=l2; total time=   3.5s




[CV] END ...........C=100, intercept_scaling=1.0, penalty=l2; total time=   3.4s
[CV] END ..........C=100, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END ..........C=100, intercept_scaling=10.0, penalty=l2; total time=   7.8s




[CV] END ..........C=100, intercept_scaling=10.0, penalty=l2; total time=   7.8s




[CV] END ..........C=100, intercept_scaling=10.0, penalty=l2; total time=   7.9s




[CV] END ..........C=100, intercept_scaling=10.0, penalty=l2; total time=   8.0s




[CV] END ..........C=100, intercept_scaling=10.0, penalty=l2; total time=   7.8s
[CV] END ...........C=100, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END ...........C=100, intercept_scaling=100, penalty=l2; total time=  27.6s




[CV] END ...........C=100, intercept_scaling=100, penalty=l2; total time=  27.1s




[CV] END ...........C=100, intercept_scaling=100, penalty=l2; total time=  28.4s




[CV] END ...........C=100, intercept_scaling=100, penalty=l2; total time=  29.1s


180 fits failed out of a total of 360.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
180 fits failed with the following error:
Traceback (most recent call last):
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/model_selection/_validation.py", line 732, in _fit_and_score
    estimator.fit(X_train, y_train, **fit_params)
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/base.py", line 1151, in wrapper
    return fit_method(estimator, *args, **kwargs)
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/svm/_classes.py", line 315,

[CV] END ...........C=100, intercept_scaling=100, penalty=l2; total time=  28.3s
Best Hyperparameters: {'C': 0.1, 'intercept_scaling': 100, 'penalty': 'l2'}
F1-micro Score on Test Set: 0.6136865342163356




In [16]:
model, model_params = finetune(
    X_train_glove, 
    y_train,
    LinearSVC(loss="squared_hinge", class_weight="balanced", random_state=42),
    {
        "penalty": ["l1", "l2"],
        "C": [0.001, 0.01, 0.1, 1.0, 10.0, 100],
        "intercept_scaling": [0.001, 0.01, 0.1, 1.0, 10.0, 100]
    },
    "f1_micro",
    cv=5,
    verbose=2,
    )
print("Best Hyperparameters:", model_params)
results["linear svm glove"] = evaluate(X_test_glove, y_test, model)
print("F1-micro Score on Test Set:", results["linear svm glove"])



Fitting 5 folds for each of 72 candidates, totalling 360 fits
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l2; total time=   0.5s




[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l2; total time=   0.5s




[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l2; total time=   0.5s




[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l2; total time=   0.5s




[CV] END .......C=0.001, intercept_scaling=0.001, penalty=l2; total time=   0.5s
[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l2; total time=   0.5s




[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l2; total time=   0.5s




[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l2; total time=   0.5s




[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l2; total time=   0.5s




[CV] END ........C=0.001, intercept_scaling=0.01, penalty=l2; total time=   0.5s
[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=0.1, penalty=l2; total time=   0.5s
[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l2; total time=   0.5s




[CV] END .........C=0.001, intercept_scaling=1.0, penalty=l2; total time=   0.5s
[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l2; total time=   1.3s




[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l2; total time=   1.4s




[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l2; total time=   1.5s




[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l2; total time=   1.5s




[CV] END ........C=0.001, intercept_scaling=10.0, penalty=l2; total time=   1.4s
[CV] END .........C=0.001, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END .........C=0.001, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END .........C=0.001, intercept_scaling=100, penalty=l2; total time=  29.2s




[CV] END .........C=0.001, intercept_scaling=100, penalty=l2; total time=  29.6s




[CV] END .........C=0.001, intercept_scaling=100, penalty=l2; total time=  31.4s




[CV] END .........C=0.001, intercept_scaling=100, penalty=l2; total time=  31.3s




[CV] END .........C=0.001, intercept_scaling=100, penalty=l2; total time=  30.4s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l2; total time=   0.6s




[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l2; total time=   0.6s




[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l2; total time=   0.6s




[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l2; total time=   0.6s




[CV] END ........C=0.01, intercept_scaling=0.001, penalty=l2; total time=   0.6s
[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l2; total time=   0.6s




[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l2; total time=   0.6s




[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l2; total time=   0.6s




[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l2; total time=   0.6s




[CV] END .........C=0.01, intercept_scaling=0.01, penalty=l2; total time=   0.6s
[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l2; total time=   0.6s




[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l2; total time=   0.6s




[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l2; total time=   0.6s




[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l2; total time=   0.6s




[CV] END ..........C=0.01, intercept_scaling=0.1, penalty=l2; total time=   0.6s
[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l2; total time=   0.6s




[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l2; total time=   0.6s




[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l2; total time=   0.7s




[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l2; total time=   0.7s




[CV] END ..........C=0.01, intercept_scaling=1.0, penalty=l2; total time=   0.6s
[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l2; total time=   2.7s




[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l2; total time=   2.8s




[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l2; total time=   3.0s




[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l2; total time=   2.9s




[CV] END .........C=0.01, intercept_scaling=10.0, penalty=l2; total time=   2.8s
[CV] END ..........C=0.01, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=0.01, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END ..........C=0.01, intercept_scaling=100, penalty=l2; total time=  26.5s




[CV] END ..........C=0.01, intercept_scaling=100, penalty=l2; total time=  27.0s




[CV] END ..........C=0.01, intercept_scaling=100, penalty=l2; total time=  27.7s




[CV] END ..........C=0.01, intercept_scaling=100, penalty=l2; total time=  27.5s




[CV] END ..........C=0.01, intercept_scaling=100, penalty=l2; total time=  27.3s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l2; total time=   0.9s




[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l2; total time=   0.9s




[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l2; total time=   0.9s




[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l2; total time=   0.9s




[CV] END .........C=0.1, intercept_scaling=0.001, penalty=l2; total time=   0.9s
[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l2; total time=   0.9s




[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l2; total time=   0.9s




[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l2; total time=   0.8s




[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l2; total time=   0.9s




[CV] END ..........C=0.1, intercept_scaling=0.01, penalty=l2; total time=   0.9s
[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l2; total time=   0.9s




[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l2; total time=   0.9s




[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l2; total time=   0.9s




[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l2; total time=   0.9s




[CV] END ...........C=0.1, intercept_scaling=0.1, penalty=l2; total time=   0.9s
[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l2; total time=   0.9s




[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l2; total time=   0.9s




[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l2; total time=   0.9s




[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l2; total time=   0.9s




[CV] END ...........C=0.1, intercept_scaling=1.0, penalty=l2; total time=   0.9s
[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l2; total time=   4.5s




[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l2; total time=   4.3s




[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l2; total time=   4.4s




[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l2; total time=   4.3s




[CV] END ..........C=0.1, intercept_scaling=10.0, penalty=l2; total time=   4.1s
[CV] END ...........C=0.1, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=0.1, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END ...........C=0.1, intercept_scaling=100, penalty=l2; total time=  22.6s




[CV] END ...........C=0.1, intercept_scaling=100, penalty=l2; total time=  22.2s




[CV] END ...........C=0.1, intercept_scaling=100, penalty=l2; total time=  22.5s




[CV] END ...........C=0.1, intercept_scaling=100, penalty=l2; total time=  22.6s




[CV] END ...........C=0.1, intercept_scaling=100, penalty=l2; total time=  22.4s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s




[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l2; total time=   2.1s




[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l2; total time=   2.0s
[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l2; total time=   1.9s




[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l2; total time=   2.1s




[CV] END .........C=1.0, intercept_scaling=0.001, penalty=l2; total time=   2.1s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l2; total time=   2.1s




[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l2; total time=   2.1s
[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l2; total time=   1.8s




[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l2; total time=   2.2s




[CV] END ..........C=1.0, intercept_scaling=0.01, penalty=l2; total time=   2.1s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l2; total time=   2.2s




[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l2; total time=   2.1s
[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l2; total time=   1.8s




[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l2; total time=   2.1s




[CV] END ...........C=1.0, intercept_scaling=0.1, penalty=l2; total time=   2.0s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l2; total time=   1.9s




[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l2; total time=   2.0s
[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l2; total time=   1.9s




[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l2; total time=   2.0s




[CV] END ...........C=1.0, intercept_scaling=1.0, penalty=l2; total time=   1.9s
[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l2; total time=   5.4s




[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l2; total time=   5.4s




[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l2; total time=   5.4s




[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l2; total time=   5.5s




[CV] END ..........C=1.0, intercept_scaling=10.0, penalty=l2; total time=   5.4s
[CV] END ...........C=1.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=1.0, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END ...........C=1.0, intercept_scaling=100, penalty=l2; total time=  21.3s




[CV] END ...........C=1.0, intercept_scaling=100, penalty=l2; total time=  21.3s




[CV] END ...........C=1.0, intercept_scaling=100, penalty=l2; total time=  21.9s




[CV] END ...........C=1.0, intercept_scaling=100, penalty=l2; total time=  22.0s




[CV] END ...........C=1.0, intercept_scaling=100, penalty=l2; total time=  21.7s
[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l1; total time=   0.0s




[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l2; total time=   3.9s




[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l2; total time=   4.0s




[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l2; total time=   3.7s




[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l2; total time=   3.9s




[CV] END ........C=10.0, intercept_scaling=0.001, penalty=l2; total time=   3.9s
[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l2; total time=   4.0s




[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l2; total time=   4.0s




[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l2; total time=   3.7s




[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l2; total time=   3.9s




[CV] END .........C=10.0, intercept_scaling=0.01, penalty=l2; total time=   3.9s
[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l2; total time=   3.9s




[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l2; total time=   3.9s




[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l2; total time=   3.6s




[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l2; total time=   3.9s




[CV] END ..........C=10.0, intercept_scaling=0.1, penalty=l2; total time=   3.9s
[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l2; total time=   3.4s




[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l2; total time=   3.6s




[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l2; total time=   3.5s




[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l2; total time=   3.5s




[CV] END ..........C=10.0, intercept_scaling=1.0, penalty=l2; total time=   3.5s
[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l2; total time=   5.3s




[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l2; total time=   5.3s




[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l2; total time=   5.3s




[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l2; total time=   5.3s




[CV] END .........C=10.0, intercept_scaling=10.0, penalty=l2; total time=   5.2s
[CV] END ..........C=10.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ..........C=10.0, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END ..........C=10.0, intercept_scaling=100, penalty=l2; total time=  21.4s




[CV] END ..........C=10.0, intercept_scaling=100, penalty=l2; total time=  21.3s




[CV] END ..........C=10.0, intercept_scaling=100, penalty=l2; total time=  21.7s




[CV] END ..........C=10.0, intercept_scaling=100, penalty=l2; total time=  21.6s




[CV] END ..........C=10.0, intercept_scaling=100, penalty=l2; total time=  21.9s
[CV] END .........C=100, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=100, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=100, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=100, intercept_scaling=0.001, penalty=l1; total time=   0.0s
[CV] END .........C=100, intercept_scaling=0.001, penalty=l1; total time=   0.0s




[CV] END .........C=100, intercept_scaling=0.001, penalty=l2; total time=   3.8s




[CV] END .........C=100, intercept_scaling=0.001, penalty=l2; total time=   3.8s




[CV] END .........C=100, intercept_scaling=0.001, penalty=l2; total time=   3.6s




[CV] END .........C=100, intercept_scaling=0.001, penalty=l2; total time=   3.8s




[CV] END .........C=100, intercept_scaling=0.001, penalty=l2; total time=   3.7s
[CV] END ..........C=100, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=0.01, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=0.01, penalty=l1; total time=   0.0s




[CV] END ..........C=100, intercept_scaling=0.01, penalty=l2; total time=   3.6s




[CV] END ..........C=100, intercept_scaling=0.01, penalty=l2; total time=   3.8s




[CV] END ..........C=100, intercept_scaling=0.01, penalty=l2; total time=   3.6s




[CV] END ..........C=100, intercept_scaling=0.01, penalty=l2; total time=   3.8s




[CV] END ..........C=100, intercept_scaling=0.01, penalty=l2; total time=   3.7s
[CV] END ...........C=100, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=0.1, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=0.1, penalty=l1; total time=   0.0s




[CV] END ...........C=100, intercept_scaling=0.1, penalty=l2; total time=   3.7s




[CV] END ...........C=100, intercept_scaling=0.1, penalty=l2; total time=   3.6s




[CV] END ...........C=100, intercept_scaling=0.1, penalty=l2; total time=   3.6s




[CV] END ...........C=100, intercept_scaling=0.1, penalty=l2; total time=   3.6s




[CV] END ...........C=100, intercept_scaling=0.1, penalty=l2; total time=   3.7s
[CV] END ...........C=100, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=1.0, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=1.0, penalty=l1; total time=   0.0s




[CV] END ...........C=100, intercept_scaling=1.0, penalty=l2; total time=   3.3s




[CV] END ...........C=100, intercept_scaling=1.0, penalty=l2; total time=   3.4s




[CV] END ...........C=100, intercept_scaling=1.0, penalty=l2; total time=   3.4s




[CV] END ...........C=100, intercept_scaling=1.0, penalty=l2; total time=   3.4s




[CV] END ...........C=100, intercept_scaling=1.0, penalty=l2; total time=   3.4s
[CV] END ..........C=100, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=10.0, penalty=l1; total time=   0.0s
[CV] END ..........C=100, intercept_scaling=10.0, penalty=l1; total time=   0.0s




[CV] END ..........C=100, intercept_scaling=10.0, penalty=l2; total time=   5.3s




[CV] END ..........C=100, intercept_scaling=10.0, penalty=l2; total time=   5.4s




[CV] END ..........C=100, intercept_scaling=10.0, penalty=l2; total time=   5.4s




[CV] END ..........C=100, intercept_scaling=10.0, penalty=l2; total time=   5.4s




[CV] END ..........C=100, intercept_scaling=10.0, penalty=l2; total time=   5.3s
[CV] END ...........C=100, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=100, penalty=l1; total time=   0.0s
[CV] END ...........C=100, intercept_scaling=100, penalty=l1; total time=   0.0s




[CV] END ...........C=100, intercept_scaling=100, penalty=l2; total time=  21.4s




[CV] END ...........C=100, intercept_scaling=100, penalty=l2; total time=  20.8s




[CV] END ...........C=100, intercept_scaling=100, penalty=l2; total time=  21.7s




[CV] END ...........C=100, intercept_scaling=100, penalty=l2; total time=  21.6s


180 fits failed out of a total of 360.
The score on these train-test partitions for these parameters will be set to nan.
If these failures are not expected, you can try to debug them by setting error_score='raise'.

Below are more details about the failures:
--------------------------------------------------------------------------------
180 fits failed with the following error:
Traceback (most recent call last):
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/model_selection/_validation.py", line 732, in _fit_and_score
    estimator.fit(X_train, y_train, **fit_params)
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/base.py", line 1151, in wrapper
    return fit_method(estimator, *args, **kwargs)
  File "/var/tmp/xmacko1/bachelor_thesis/.pyenv/versions/3.8.9/envs/ticketing-system/lib/python3.8/site-packages/sklearn/svm/_classes.py", line 315,

[CV] END ...........C=100, intercept_scaling=100, penalty=l2; total time=  21.5s
Best Hyperparameters: {'C': 100, 'intercept_scaling': 10.0, 'penalty': 'l2'}
F1-micro Score on Test Set: 0.5905077262693157




## Random Forest

In [17]:
model, model_params = finetune(
    X_train_word2vec, 
    y_train,
    RandomForestClassifier(class_weight="balanced", random_state=42, n_jobs=-1),
    {
        "min_samples_split": [2, 4, 6, 8, 10, 12, 14, 16, 18, 20],
        "min_samples_leaf": [2, 4, 6, 8, 10, 12, 14, 16, 18, 20],
        "max_samples": [0.6, 0.7, 0.8, 0.9, 1.0]
    },
    "f1_micro",
    cv=5,
    verbose=2,
    )
print("Best Hyperparameters:", model_params)
results["random forest word2vec"] = evaluate(X_test_word2vec, y_test, model)
print("F1-micro Score on Test Set:", results["random forest word2vec"])



Fitting 5 folds for each of 500 candidates, totalling 2500 fits
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=2; total time=   0.4s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=2; total time=   0.4s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=2; total time=   0.4s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=2; total time=   0.3s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=2; total time=   0.5s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=4; total time=   0.3s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=4; total time=   0.4s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=4; total time=   0.3s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=4; total time=   0.4s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=4; total time=   0.4s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=6; total tim

In [18]:
model, model_params = finetune(
    X_train_glove, 
    y_train,
    RandomForestClassifier(class_weight="balanced", random_state=42, n_jobs=-1),
    {
        "min_samples_split": [2, 4, 6, 8, 10, 12, 14, 16, 18, 20],
        "min_samples_leaf": [2, 4, 6, 8, 10, 12, 14, 16, 18, 20],
        "max_samples": [0.6, 0.7, 0.8, 0.9, 1.0]
    },
    "f1_micro",
    cv=5,
    verbose=2,
    )
print("Best Hyperparameters:", model_params)
results["random forest glove"] = evaluate(X_test_glove, y_test, model)
print("F1-micro Score on Test Set:", results["random forest glove"])

Fitting 5 folds for each of 500 candidates, totalling 2500 fits




[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=2; total time=   0.4s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=2; total time=   0.3s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=2; total time=   0.4s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=2; total time=   0.3s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=2; total time=   0.5s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=4; total time=   0.3s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=4; total time=   0.3s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=4; total time=   0.4s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=4; total time=   0.3s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=4; total time=   0.3s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samples_split=6; total time=   0.3s
[CV] END max_samples=0.6, min_samples_leaf=2, min_samp

## Evaluation

In [19]:
pd.DataFrame.from_dict(results, orient="index", columns=["f1 micro"])

Unnamed: 0,f1 micro
dummy most common,0.333333
dummy stratified,0.189845
logistic regression word2vec,0.534216
logistic regression glove,0.565121
naive bayes glove,0.547461
linear svm word2vec,0.613687
linear svm glove,0.590508
random forest word2vec,0.567329
random forest glove,0.5883
