diff --git a/sadedegel/prebuilt/telco_sentiment.py b/sadedegel/prebuilt/telco_sentiment.py index 9fcbcfd6..e8470645 100644 --- a/sadedegel/prebuilt/telco_sentiment.py +++ b/sadedegel/prebuilt/telco_sentiment.py @@ -33,7 +33,7 @@ def build(save=True): raw = load_telco_sentiment_train() df = pd.DataFrame.from_records(raw) - df = shuffle(df) + df = shuffle(df, random_state=42) console.log(f"Corpus Size: {CORPUS_SIZE}") diff --git a/sadedegel/prebuilt/tweet_profanity.py b/sadedegel/prebuilt/tweet_profanity.py index ceb6d4d3..959ab2fd 100644 --- a/sadedegel/prebuilt/tweet_profanity.py +++ b/sadedegel/prebuilt/tweet_profanity.py @@ -33,7 +33,7 @@ def build(save=True): raw = load_offenseval_train() df = pd.DataFrame.from_records(raw) - df = shuffle(df) + df = shuffle(df, random_state=42) console.log(f"Corpus Size: {CORPUS_SIZE}") diff --git a/sadedegel/prebuilt/tweet_sentiment.py b/sadedegel/prebuilt/tweet_sentiment.py index 36833698..fac07fea 100644 --- a/sadedegel/prebuilt/tweet_sentiment.py +++ b/sadedegel/prebuilt/tweet_sentiment.py @@ -44,11 +44,11 @@ def cv(k=3, max_instances=-1): raw = load_tweet_sentiment_train() df = pd.DataFrame.from_records(raw) - df = shuffle(df) + df = shuffle(df, random_state=42) BATCH_SIZE = 1000 - kf = KFold(n_splits=k) + kf = KFold(n_splits=k, shuffle=True, random_state=42) console.log(f"Corpus Size: {CORPUS_SIZE}") scores = [] @@ -86,7 +86,7 @@ def build(max_instances=-1, save=True): raw = load_tweet_sentiment_train() df = pd.DataFrame.from_records(raw) - df = shuffle(df) + df = shuffle(df, random_state=42) BATCH_SIZE = 1000